diff --git "a/wandb/run-20220315_195757-3ex43zbl/files/output.log" "b/wandb/run-20220315_195757-3ex43zbl/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220315_195757-3ex43zbl/files/output.log" @@ -0,0 +1,6179 @@ + + + 0%| | 0/17840 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:03,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:05,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.6443, 'learning_rate': 3.0000000000000004e-08, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:07,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 1/17840 [00:08<40:55:15, 8.26s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:09,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:11,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:12,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:14,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 2/17840 [00:15<38:18:44, 7.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:16,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.6095, 'learning_rate': 6.000000000000001e-08, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:18,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:20,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:22,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 3/17840 [00:23<37:38:18, 7.60s/it] + + 0%| | 3/17840 [00:23<37:38:18, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:24,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:25,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:27,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.6287, 'learning_rate': 1.2000000000000002e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:29,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 4/17840 [00:30<36:50:39, 7.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:31,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:33,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:34,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.6099, 'learning_rate': 1.5000000000000002e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:36,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 5/17840 [00:37<36:13:27, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:38,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:40,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:41,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.6546, 'learning_rate': 1.8e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:43,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 6/17840 [00:44<35:58:13, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:45,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:47,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:49,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.5845, 'learning_rate': 2.1e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:50,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 7/17840 [00:51<35:43:51, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:52,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:54,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:58:57,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.5811, 'learning_rate': 2.4000000000000003e-07, 'epoch': 0.01} + 0%| | 8/17840 [00:58<35:31:17, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:58:59,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:01,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:03,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.5843, 'learning_rate': 2.7e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:04,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 9/17840 [01:05<35:10:26, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:06,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:08,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.5457, 'learning_rate': 3.0000000000000004e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:10,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:11,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 10/17840 [01:12<34:54:46, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:13,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:15,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:16,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.5463, 'learning_rate': 3.2999999999999996e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:18,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 11/17840 [01:19<34:41:01, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:20,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:22,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:23,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.5246, 'learning_rate': 3.6e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:25,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 12/17840 [01:26<34:29:54, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:27,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:29,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:30,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:32,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 13/17840 [01:33<34:18:04, 6.93s/it] + + 0%| | 13/17840 [01:33<34:18:04, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:34,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:35,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:37,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.503, 'learning_rate': 4.2e-07, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:39,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 14/17840 [01:39<34:04:30, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:40,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:42,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:44,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.4614, 'learning_rate': 4.5e-07, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 15/17840 [01:46<33:50:58, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:47,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:49,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:50,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:52,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 16/17840 [01:53<33:38:52, 6.80s/it] + + 0%| | 16/17840 [01:53<33:38:52, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 19:59:54,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:55,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:57,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 19:59:59,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 17/17840 [02:00<33:27:07, 6.76s/it] + + 0%| | 17/17840 [02:00<33:27:07, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:00,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:02,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:04,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.3846, 'learning_rate': 5.4e-07, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:05,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 18/17840 [02:06<33:12:27, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:07,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:09,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:10,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:12,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 19/17840 [02:13<33:04:35, 6.68s/it] + + 0%| | 19/17840 [02:13<33:04:35, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:14,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:15,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:17,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:18,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 20/17840 [02:19<32:44:53, 6.62s/it] + + 0%| | 20/17840 [02:19<32:44:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:20,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:22,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:23,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:25,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 21/17840 [02:26<32:26:44, 6.56s/it] + + 0%| | 21/17840 [02:26<32:26:44, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:27,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:28,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:30,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:31,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 22/17840 [02:32<32:22:08, 6.54s/it] + + 0%| | 22/17840 [02:32<32:22:08, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:33,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:35,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:36,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:38,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 23/17840 [02:39<32:09:39, 6.50s/it] + + 0%| | 23/17840 [02:39<32:09:39, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:39,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:41,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:43,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.2276, 'learning_rate': 7.2e-07, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:44,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 24/17840 [02:45<31:56:29, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:46,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:47,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:49,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:52,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 25/17840 [02:53<33:37:53, 6.80s/it] + 0%| | 25/17840 [02:53<33:37:53, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:00:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:55,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:00:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:58,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:00:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:00:58,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:00:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [02:59<33:01:33, 6.67s/it] + 0%| | 26/17840 [02:59<33:01:33, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:00,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [02:59<33:01:33, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:00,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:05<32:25:38, 6.55s/it]g-point operations will not be computed-15 20:01:00,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:05<32:25:38, 6.55s/it]g-point operations will not be computed-15 20:01:00,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:05<32:25:38, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:06,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:05<32:25:38, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:06,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:09,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:06,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:09,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:06,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:12<32:05:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:12,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:12<32:05:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:12,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:12<32:05:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:12,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:18<31:34:40, 6.38s/it]g-point operations will not be computed-15 20:01:12,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:18<31:34:40, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:18,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:18<31:34:40, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:18,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:18<31:34:40, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:18,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:24<31:17:24, 6.32s/it]g-point operations will not be computed-15 20:01:18,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:24<31:17:24, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:25,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:24<31:17:24, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:25,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:30<31:00:44, 6.27s/it]g-point operations will not be computed-15 20:01:25,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:30<31:00:44, 6.27s/it]g-point operations will not be computed-15 20:01:25,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:30<31:00:44, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:31,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:30<31:00:44, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:31,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:34,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:31,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:34,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:31,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:36<31:19:43, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:37,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:36<31:19:43, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:37,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:42<30:45:32, 6.22s/it]g-point operations will not be computed-15 20:01:37,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:42<30:45:32, 6.22s/it]g-point operations will not be computed-15 20:01:37,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:42<30:45:32, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:43,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:46,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:43,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:46,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:43,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:48<29:54:19, 6.05s/it]g-point operations will not be computed-15 20:01:43,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:48<29:54:19, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:49,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:52,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:49,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:52,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:49,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:54<29:31:04, 5.97s/it]g-point operations will not be computed-15 20:01:49,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:54<29:31:04, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:01:55,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:57,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:55,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:01:57,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:01:55,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [03:59<28:59:35, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:00,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [03:59<28:59:35, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:00,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:05<28:29:03, 5.76s/it]g-point operations will not be computed-15 20:02:00,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:05<28:29:03, 5.76s/it]g-point operations will not be computed-15 20:02:00,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:05<28:29:03, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:06,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:08,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:06,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:08,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:06,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [04:11<28:16:22, 5.72s/it]g-point operations will not be computed-15 20:02:06,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [04:11<28:16:22, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:14,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:14,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:16<27:27:58, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:16,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:19,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:16,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:19,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:16,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:21<26:44:08, 5.41s/it]g-point operations will not be computed-15 20:02:16,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:21<26:44:08, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:21,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:24,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:21,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:24,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:21,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:26<26:00:10, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:26,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:28,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:26,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:28,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:26,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:30<25:00:31, 5.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:31,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:33,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:31,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:33,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:31,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:35<23:54:11, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:35,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:37,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:35,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:37,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:35,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:39<22:44:01, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:39,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:41,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:39,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:41,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:39,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:42<21:15:13, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:42,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:42<21:15:13, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:42,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:46<19:39:16, 3.98s/it]g-point operations will not be computed-15 20:02:42,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:47,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:46,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:47,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:46,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [04:48<18:03:30, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:48,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [04:48<18:03:30, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:48,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [04:51<16:34:11, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:51,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [04:51<16:34:11, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:51,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 49/17840 [04:53<15:11:06, 3.07s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:53,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:54,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:53,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:02:54,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:53,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:57<15:30:47, 3.14s/it]g-point operations will not be computed-15 20:02:53,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:57<15:30:47, 3.14s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:58,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:57<15:30:47, 3.14s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:02:58,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:02,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:58,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:02,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:02:58,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:04<22:11:27, 4.49s/it]g-point operations will not be computed-15 20:02:58,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:04<22:11:27, 4.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:06,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:09,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:06,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:12<26:23:49, 5.34s/it]g-point operations will not be computed-15 20:03:06,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:12<26:23:49, 5.34s/it]g-point operations will not be computed-15 20:03:06,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:12<26:23:49, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:13,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:12<26:23:49, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:13,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:16,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:13,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:16,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:13,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:19<29:20:10, 5.94s/it]g-point operations will not be computed-15 20:03:13,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:19<29:20:10, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:20,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:24,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:20,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:26<31:06:36, 6.30s/it]g-point operations will not be computed-15 20:03:20,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:26<31:06:36, 6.30s/it]g-point operations will not be computed-15 20:03:20,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:26<31:06:36, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:26<31:06:36, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:31,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:31,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:33<32:12:34, 6.52s/it]g-point operations will not be computed-15 20:03:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:33<32:12:34, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:34,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:38,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:34,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:40<32:58:18, 6.67s/it]g-point operations will not be computed-15 20:03:34,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:40<32:58:18, 6.67s/it]g-point operations will not be computed-15 20:03:34,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:40<32:58:18, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:41,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:40<32:58:18, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:41,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:45,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:41,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:45,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:41,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:47<33:30:31, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:48,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:47<33:30:31, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:48,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:03:52,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:03:48,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<33:48:15, 6.84s/it]g-point operations will not be computed-15 20:03:48,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<33:48:15, 6.84s/it]g-point operations will not be computed-15 20:03:48,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<33:48:15, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:55,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<33:48:15, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:03:55,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<33:54:56, 6.87s/it]g-point operations will not be computed-15 20:03:55,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<33:54:56, 6.87s/it]g-point operations will not be computed-15 20:03:55,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<33:54:56, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:02,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<33:54:56, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:02,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:06,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:02,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:06,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:02,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:08<33:54:06, 6.86s/it]g-point operations will not be computed-15 20:04:02,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:08<33:54:06, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:09,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:12,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:09,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:02:59, 6.89s/it]g-point operations will not be computed-15 20:04:09,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:02:59, 6.89s/it]g-point operations will not be computed-15 20:04:09,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:02:59, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:16,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:02:59, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:16,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:19,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:16,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:19,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:16,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:22<33:59:38, 6.88s/it]g-point operations will not be computed-15 20:04:16,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:22<33:59:38, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:23,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:26,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:23,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:26,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:23,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:29<33:49:42, 6.85s/it]g-point operations will not be computed-15 20:04:23,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:29<33:49:42, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:29<33:49:42, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<33:39:22, 6.82s/it]g-point operations will not be computed-15 20:04:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<33:39:22, 6.82s/it]g-point operations will not be computed-15 20:04:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<33:39:22, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:36,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<33:39:22, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:36,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:40,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:36,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:40,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:36,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:42<33:28:24, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:43,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:42<33:28:24, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:43,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:46,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:43,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:46,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:43,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:49<33:14:46, 6.73s/it]g-point operations will not be computed-15 20:04:43,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:49<33:14:46, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:50,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:04:53,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:50,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:06:43, 6.71s/it]g-point operations will not be computed-15 20:04:50,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:06:43, 6.71s/it]g-point operations will not be computed-15 20:04:50,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:06:43, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:04:56,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:00,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:04:56,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:02<32:59:29, 6.68s/it]g-point operations will not be computed-15 20:04:56,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:02<32:59:29, 6.68s/it]g-point operations will not be computed-15 20:04:56,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:02<32:59:29, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:03,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:02<32:59:29, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:03,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<32:49:17, 6.65s/it]g-point operations will not be computed-15 20:05:03,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<32:49:17, 6.65s/it]g-point operations will not be computed-15 20:05:03,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<32:49:17, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:09,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<32:49:17, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:09,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:13,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:09,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:13,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:09,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:15<32:31:12, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:16,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:15<32:31:12, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:16,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:19,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:16,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:19,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:16,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:22<32:26:30, 6.57s/it]g-point operations will not be computed-15 20:05:16,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:22<32:26:30, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:22,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:26,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:22,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:26,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:22,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:28<32:18:19, 6.55s/it]g-point operations will not be computed-15 20:05:22,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:28<32:18:19, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:29,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:32,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:29,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:34<32:04:03, 6.50s/it]g-point operations will not be computed-15 20:05:29,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:34<32:04:03, 6.50s/it]g-point operations will not be computed-15 20:05:29,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:34<32:04:03, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:35,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:38,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:35,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<31:53:17, 6.46s/it]g-point operations will not be computed-15 20:05:35,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<31:53:17, 6.46s/it]g-point operations will not be computed-15 20:05:35,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<31:53:17, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:42,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<31:53:17, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:42,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:45,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:42,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<33:28:03, 6.78s/it]g-point operations will not be computed-15 20:05:42,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<33:28:03, 6.78s/it]g-point operations will not be computed-15 20:05:42,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<33:28:03, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:52,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:48:32, 6.65s/it]g-point operations will not be computed-15 20:05:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:48:32, 6.65s/it]g-point operations will not be computed-15 20:05:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:48:32, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:05:55,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:05:59,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:05:55,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<32:14:41, 6.54s/it]g-point operations will not be computed-15 20:05:55,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<32:14:41, 6.54s/it]g-point operations will not be computed-15 20:05:55,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<32:14:41, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:06:02,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:05,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:02,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:40:04, 6.42s/it]g-point operations will not be computed-15 20:06:02,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:40:04, 6.42s/it]g-point operations will not be computed-15 20:06:02,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:40:04, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:06:08,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:11,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:08,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:11:59, 6.32s/it]g-point operations will not be computed-15 20:06:08,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:11:59, 6.32s/it]g-point operations will not be computed-15 20:06:08,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:11:59, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:06:14,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:17,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:14,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:49:16, 6.25s/it]g-point operations will not be computed-15 20:06:14,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:49:16, 6.25s/it]g-point operations will not be computed-15 20:06:14,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:49:16, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:23,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:23,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:25<30:26:52, 6.17s/it]g-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:31<30:11:37, 6.12s/it]g-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:31<30:11:37, 6.12s/it]g-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:34,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:34,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [08:37<29:54:34, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [08:37<29:54:34, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1533, 'learning_rate': 2.4900000000000003e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:42,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:42,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0996, 'learning_rate': 2.52e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:42,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:48,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:48,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1751, 'learning_rate': 2.55e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:52,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 86/17840 [08:54<28:36:07, 5.80s/it]g-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 86/17840 [08:54<28:36:07, 5.80s/it]g-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:56,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:06:56,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:06:38,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 87/17840 [09:00<28:11:52, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 87/17840 [09:00<28:11:52, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1013, 'learning_rate': 2.61e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:04,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:04,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0572, 'learning_rate': 2.6399999999999997e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:08,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 89/17840 [09:10<27:11:08, 5.51s/it]g-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 89/17840 [09:10<27:11:08, 5.51s/it]g-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:12,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:15,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:15,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:17,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:17,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:17,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 91/17840 [09:20<25:29:25, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:21,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:23,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:21,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 92/17840 [09:25<24:31:02, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 92/17840 [09:25<24:31:02, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:27,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:27,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 93/17840 [09:29<23:22:34, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:29,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:31,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:29,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:31,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:29,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [09:33<22:10:11, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:33,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:35,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:33,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:35,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:33,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 95/17840 [09:37<21:03:55, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:37,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:38,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:37,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:38,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:37,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 96/17840 [09:40<19:46:25, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:40,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 96/17840 [09:40<19:46:25, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:40,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 97/17840 [09:43<18:16:30, 3.71s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:43,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 97/17840 [09:43<18:16:30, 3.71s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:43,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 98/17840 [09:46<16:46:55, 3.41s/it]g-point operations will not be computed-15 20:07:43,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:47,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:46,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:47,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:46,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:49,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:48,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:49,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:48,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [09:51<15:32:54, 3.16s/it]g-point operations will not be computed-15 20:07:48,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [09:51<15:32:54, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:53,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [09:51<15:32:54, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:07:53,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:56,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:53,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:07:56,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:07:53,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:59<22:18:45, 4.53s/it]g-point operations will not be computed-15 20:07:53,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:59<22:18:45, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:59<22:18:45, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:06,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:06,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1717, 'learning_rate': 3.06e-06, 'epoch': 0.11} +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:14<29:11:43, 5.93s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:14<29:11:43, 5.93s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:14<29:11:43, 5.93s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:14<29:11:43, 5.93s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:14<29:11:43, 5.93s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:21<31:06:31, 6.31s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:21<31:06:31, 6.31s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:25,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:25,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:28<32:15:30, 6.55s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:28<32:15:30, 6.55s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:28<32:15:30, 6.55s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:28<32:15:30, 6.55s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:28<32:15:30, 6.55s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [10:35<32:54:12, 6.68s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:38,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:38,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:38,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [10:42<33:20:35, 6.77s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [10:42<33:20:35, 6.77s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [10:42<33:20:35, 6.77s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:48,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:48,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0297, 'learning_rate': 3.24e-06, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:48,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:48,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:08:48,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [10:56<33:49:53, 6.87s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [10:56<33:49:53, 6.87s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:00,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:03<33:46:25, 6.86s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:03<33:46:25, 6.86s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0273, 'learning_rate': 3.3e-06, 'epoch': 0.12} + 1%|▍ | 110/17840 [11:03<33:46:25, 6.86s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9895, 'learning_rate': 3.3300000000000003e-06, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:16<33:29:46, 6.80s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:16<33:29:46, 6.80s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:20,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [11:23<33:22:00, 6.78s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [11:23<33:22:00, 6.78s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.896, 'learning_rate': 3.39e-06, 'epoch': 0.13} + 1%|▍ | 113/17840 [11:23<33:22:00, 6.78s/it]g-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:29,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:29,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9328, 'learning_rate': 3.4200000000000003e-06, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:29,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:29,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:29,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:08:00,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [11:36<33:12:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [11:36<33:12:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [11:36<33:12:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [11:36<33:12:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 116/17840 [11:43<32:56:52, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:45,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:45,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [11:49<32:47:48, 6.66s/it]g-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [11:49<32:47:48, 6.66s/it]g-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9879, 'learning_rate': 3.5100000000000003e-06, 'epoch': 0.13} + 1%|▍ | 117/17840 [11:49<32:47:48, 6.66s/it]g-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:55,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:55,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9539, 'learning_rate': 3.54e-06, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-15 20:09:55,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:02,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:02,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.922, 'learning_rate': 3.57e-06, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:02,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:02,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:02,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:09:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:09<32:19:23, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:09<32:19:23, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:09<32:19:23, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 121/17840 [12:16<32:11:55, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 121/17840 [12:16<32:11:55, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:18,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:18,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 122/17840 [12:22<32:01:37, 6.51s/it]g-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 122/17840 [12:22<32:01:37, 6.51s/it]g-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:24,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:24,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [12:28<31:50:23, 6.47s/it]g-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [12:28<31:50:23, 6.47s/it]g-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:31,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:31,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:35<31:35:47, 6.42s/it]g-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:35<31:35:47, 6.42s/it]g-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:37,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:37,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:10,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [12:42<33:09:56, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [12:42<33:09:56, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9362, 'learning_rate': 3.75e-06, 'epoch': 0.14} + 1%|▌ | 125/17840 [12:42<33:09:56, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [12:48<32:36:18, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [12:48<32:36:18, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:51,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:51,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [12:55<32:03:43, 6.52s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [12:55<32:03:43, 6.52s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:57,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:10:57,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:01<31:36:29, 6.42s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:01<31:36:29, 6.42s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:03,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:03,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [13:07<31:05:02, 6.32s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [13:07<31:05:02, 6.32s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:09,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:09,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [13:13<30:37:19, 6.22s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [13:13<30:37:19, 6.22s/it]g-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:15,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:15,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:10:43,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:19<30:19:37, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:11:20,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:19<30:19:37, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:11:20,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8689, 'learning_rate': 3.9300000000000005e-06, 'epoch': 0.15} + 1%|▌ | 131/17840 [13:19<30:19:37, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:11:20,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [13:25<30:04:21, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [13:25<30:04:21, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8421, 'learning_rate': 3.96e-06, 'epoch': 0.15} + 1%|▌ | 132/17840 [13:25<30:04:21, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:30,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:30,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:34,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:34,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 134/17840 [13:37<29:09:16, 5.93s/it]g-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 134/17840 [13:37<29:09:16, 5.93s/it]g-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 134/17840 [13:37<29:09:16, 5.93s/it]g-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 134/17840 [13:37<29:09:16, 5.93s/it]g-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:41,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:41,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:46,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:46,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [13:48<28:18:58, 5.76s/it]g-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:50,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:52,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:52,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8156, 'learning_rate': 4.1100000000000005e-06, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:56,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:11:56,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 138/17840 [13:58<27:08:41, 5.52s/it]g-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:00,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.7465, 'learning_rate': 4.170000000000001e-06, 'epoch': 0.16} +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:06,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:06,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:11:26,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 140/17840 [14:08<25:39:08, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 140/17840 [14:08<25:39:08, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 140/17840 [14:08<25:39:08, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:12,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:14,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:14,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:16,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:18,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:18,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:20,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:22,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:22,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:24,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:27,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:27,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:29,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:29,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:30,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:33,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:33,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:35,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:35,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:37,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:37,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:38,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:39,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:39,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:42,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:45,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:45,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:49,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:49,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8296, 'learning_rate': 4.53e-06, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:53,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:53,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:53,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:12:56,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:00,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:00,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:04<28:24:37, 5.78s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:04<28:24:37, 5.78s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.7365, 'learning_rate': 4.59e-06, 'epoch': 0.17} + 1%|▋ | 153/17840 [15:04<28:24:37, 5.78s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:04<28:24:37, 5.78s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:04<28:24:37, 5.78s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:11<30:21:29, 6.18s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:14,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:14,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:18<31:53:29, 6.49s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:18<31:53:29, 6.49s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.6983, 'learning_rate': 4.65e-06, 'epoch': 0.17} + 1%|▋ | 155/17840 [15:18<31:53:29, 6.49s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:18<31:53:29, 6.49s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:18<31:53:29, 6.49s/it]g-point operations will not be computed-15 20:12:09,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:25<32:36:56, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:25<32:36:56, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:25<32:36:56, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [15:32<33:02:40, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [15:32<33:02:40, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.7459, 'learning_rate': 4.71e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:37,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:23:51, 6.80s/it]g-point operations will not be computed-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:23:51, 6.80s/it]g-point operations will not be computed-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.7497, 'learning_rate': 4.74e-06, 'epoch': 0.18} + 1%|▋ | 158/17840 [15:39<33:23:51, 6.80s/it]g-point operations will not be computed-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:23:51, 6.80s/it]g-point operations will not be computed-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:23:51, 6.80s/it]g-point operations will not be computed-15 20:13:26,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [15:46<33:33:03, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [15:46<33:33:03, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [15:46<33:33:03, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [15:53<33:39:46, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [15:53<33:39:46, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.7082, 'learning_rate': 4.800000000000001e-06, 'epoch': 0.18} + 1%|▋ | 160/17840 [15:53<33:39:46, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:59,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:59,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5745, 'learning_rate': 4.83e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:59,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:13:59,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:07<33:18:39, 6.78s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:07<33:18:39, 6.78s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:09,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:09,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:13<33:11:33, 6.76s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:13<33:11:33, 6.76s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.6412, 'learning_rate': 4.890000000000001e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:18,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:18,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:06:53, 6.74s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:06:53, 6.74s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:06:53, 6.74s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:06:53, 6.74s/it]g-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:26,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:26,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:26,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:26,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:26,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:13:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [16:33<32:51:15, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [16:33<32:51:15, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [16:33<32:51:15, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [16:33<32:51:15, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [16:40<32:38:31, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:42,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:42,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:42,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [16:46<32:26:47, 6.61s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [16:46<32:26:47, 6.61s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:50,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:50,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [16:53<32:21:46, 6.59s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [16:53<32:21:46, 6.59s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:14:57,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [16:59<32:13:01, 6.56s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [16:59<32:13:01, 6.56s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5221, 'learning_rate': 5.1e-06, 'epoch': 0.19} + 1%|▋ | 170/17840 [16:59<32:13:01, 6.56s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [16:59<32:13:01, 6.56s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [16:59<32:13:01, 6.56s/it]g-point operations will not be computed-15 20:14:34,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:06<32:03:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:07,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:06<32:03:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:07,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:06<32:03:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:07,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:06<32:03:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:07,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:12<31:54:18, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:13,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:12<31:54:18, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:13,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:12<31:54:18, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:13,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:12<31:54:18, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:13,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:19<31:36:52, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:19<31:36:52, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:19<31:36:52, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:19<31:36:52, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:25<31:28:15, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:27,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:27,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<33:00:33, 6.73s/it]g-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<33:00:33, 6.73s/it]g-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4849, 'learning_rate': 5.25e-06, 'epoch': 0.2} + 1%|▋ | 175/17840 [17:32<33:00:33, 6.73s/it]g-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<33:00:33, 6.73s/it]g-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<33:00:33, 6.73s/it]g-point operations will not be computed-15 20:15:19,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [17:39<32:24:17, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [17:39<32:24:17, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5221, 'learning_rate': 5.31e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:50,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:50,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4784, 'learning_rate': 5.34e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:50,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:56,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:56,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5325, 'learning_rate': 5.37e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-15 20:15:56,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:02,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:02,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4689, 'learning_rate': 5.4e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:02,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:08,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:08,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4975, 'learning_rate': 5.43e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:12,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [18:15<29:32:31, 6.02s/it]g-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [18:15<29:32:31, 6.02s/it]g-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:17,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:17,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [18:20<29:10:07, 5.95s/it]g-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [18:20<29:10:07, 5.95s/it]g-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:23,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:23,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:23,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [18:26<28:46:19, 5.87s/it]g-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:28,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:28,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:28,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:15:39,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [18:32<28:21:42, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [18:32<28:21:42, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:36,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:36,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4913, 'learning_rate': 5.58e-06, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:40,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:40,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 187/17840 [18:42<27:21:03, 5.58s/it]g-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:44,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:47,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:47,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.3785, 'learning_rate': 5.64e-06, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:51,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 189/17840 [18:53<26:22:14, 5.38s/it]g-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 189/17840 [18:53<26:22:14, 5.38s/it]g-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:55,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:57,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:16:57,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.399, 'learning_rate': 5.7000000000000005e-06, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:01,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:01,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:16:32,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 191/17840 [19:03<25:09:43, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:03,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:05,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:03,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 192/17840 [19:07<24:14:38, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 192/17840 [19:07<24:14:38, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 193/17840 [19:12<23:14:15, 4.74s/it]g-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 193/17840 [19:12<23:14:15, 4.74s/it]g-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:13,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:15,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:15,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:16,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:16,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:18,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:22,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:22,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:23,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:26,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:26,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:27,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:27,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:29,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:29,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:31,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:33,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:33,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8606, 'learning_rate': 6e-06, 'epoch': 0.22} +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:36,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:36,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:36,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:40,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:44,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:44,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:47,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:47,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.6103, 'learning_rate': 6.0600000000000004e-06, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:47,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:47,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:17:47,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:17:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [19:55<28:39:52, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [19:55<28:39:52, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [19:55<28:39:52, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:23:58, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:23:58, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4199, 'learning_rate': 6.12e-06, 'epoch': 0.23} + 1%|▊ | 204/17840 [20:02<30:23:58, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:23:58, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:23:58, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:17:56,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [20:09<31:33:34, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [20:09<31:33:34, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [20:09<31:33:34, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [20:16<32:23:26, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [20:16<32:23:26, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.3683, 'learning_rate': 6.18e-06, 'epoch': 0.23} + 1%|▉ | 206/17840 [20:16<32:23:26, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:23,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:23,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.3817, 'learning_rate': 6.21e-06, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:23,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:23,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [20:30<33:10:20, 6.77s/it]g-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [20:30<33:10:20, 6.77s/it]g-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.257, 'learning_rate': 6.2399999999999995e-06, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:35,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:11:28, 6.78s/it]g-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:11:28, 6.78s/it]g-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2768, 'learning_rate': 6.27e-06, 'epoch': 0.23} + 1%|▉ | 209/17840 [20:37<33:11:28, 6.78s/it]g-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:11:28, 6.78s/it]g-point operations will not be computed-15 20:18:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [20:44<33:18:52, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [20:44<33:18:52, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.3013, 'learning_rate': 6.3e-06, 'epoch': 0.24} + 1%|▉ | 210/17840 [20:44<33:18:52, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [20:51<33:21:02, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [20:51<33:21:02, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:53,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:18:53,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 212/17840 [20:58<33:16:37, 6.80s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 212/17840 [20:58<33:16:37, 6.80s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2259, 'learning_rate': 6.36e-06, 'epoch': 0.24} + 1%|▉ | 212/17840 [20:58<33:16:37, 6.80s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 212/17840 [20:58<33:16:37, 6.80s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:03,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:03,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:03,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:03,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:03,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [21:11<32:59:29, 6.74s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:13,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:13,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:13,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [21:18<32:49:39, 6.71s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [21:18<32:49:39, 6.71s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:22,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:22,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [21:24<32:42:27, 6.68s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [21:24<32:42:27, 6.68s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [21:24<32:42:27, 6.68s/it]g-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:30,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:30,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2361, 'learning_rate': 6.51e-06, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:30,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:30,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:30,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:18:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:37<32:23:58, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:37<32:23:58, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:37<32:23:58, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:37<32:23:58, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [21:44<32:12:03, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:46,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:46,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:46,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [21:50<32:06:15, 6.56s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [21:50<32:06:15, 6.56s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:54,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:19:54,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [21:57<32:03:24, 6.55s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [21:57<32:03:24, 6.55s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [21:57<32:03:24, 6.55s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [21:57<32:03:24, 6.55s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:02,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:02,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:02,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:09,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:09,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2667, 'learning_rate': 6.69e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:09,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:15,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:15,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2641, 'learning_rate': 6.72e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:15,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:15,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [22:24<33:13:33, 6.79s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [22:24<33:13:33, 6.79s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2109, 'learning_rate': 6.750000000000001e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:28,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [22:30<32:32:51, 6.65s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [22:30<32:32:51, 6.65s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2471, 'learning_rate': 6.78e-06, 'epoch': 0.25} + 1%|▉ | 226/17840 [22:30<32:32:51, 6.65s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:35,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:35,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1764, 'learning_rate': 6.81e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:35,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:41,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:41,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1589, 'learning_rate': 6.840000000000001e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:41,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:47,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:47,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.155, 'learning_rate': 6.87e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 230/17840 [22:54<30:16:25, 6.19s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 230/17840 [22:54<30:16:25, 6.19s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1549, 'learning_rate': 6.900000000000001e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:58,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:20:58,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 231/17840 [23:00<29:57:19, 6.12s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 231/17840 [23:00<29:57:19, 6.12s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:04,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:04,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 232/17840 [23:06<29:35:38, 6.05s/it]g-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:08,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:08,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:08,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:19:38,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [23:12<29:08:39, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [23:12<29:08:39, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:17,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:17,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1341, 'learning_rate': 7.0200000000000006e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:17,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:22,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:22,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.2255, 'learning_rate': 7.049999999999999e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:26,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 236/17840 [23:29<27:55:18, 5.71s/it]g-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 236/17840 [23:29<27:55:18, 5.71s/it]g-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:31,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:33,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:33,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1129, 'learning_rate': 7.11e-06, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:37,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 238/17840 [23:39<26:59:28, 5.52s/it]g-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 238/17840 [23:39<26:59:28, 5.52s/it]g-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:41,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:41,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:41,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:13,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [23:45<26:28:28, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [23:45<26:28:28, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:49,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:49,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:51,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:51,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:51,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 241/17840 [23:54<25:07:15, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:21:55,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:57,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:55,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:21:57,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:55,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 242/17840 [23:59<24:04:12, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:21:59,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:01,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:21:59,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 243/17840 [24:03<22:56:42, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:03,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 243/17840 [24:03<22:56:42, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:03,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:05,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:03,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:05,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:03,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 244/17840 [24:07<21:40:25, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:07,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 245/17840 [24:10<20:24:42, 4.18s/it]g-point operations will not be computed-15 20:22:07,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 245/17840 [24:10<20:24:42, 4.18s/it]g-point operations will not be computed-15 20:22:07,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 245/17840 [24:10<20:24:42, 4.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:10,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 246/17840 [24:14<19:04:31, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:14,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 246/17840 [24:14<19:04:31, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:14,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 247/17840 [24:16<17:38:19, 3.61s/it]g-point operations will not be computed-15 20:22:14,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 247/17840 [24:16<17:38:19, 3.61s/it]g-point operations will not be computed-15 20:22:14,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:18,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:16,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 248/17840 [24:19<16:10:07, 3.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:19,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 248/17840 [24:19<16:10:07, 3.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:19,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 249/17840 [24:21<14:47:36, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:21,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 249/17840 [24:21<14:47:36, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:21,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 250/17840 [24:25<15:13:49, 3.12s/it]g-point operations will not be computed-15 20:22:21,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 250/17840 [24:25<15:13:49, 3.12s/it]g-point operations will not be computed-15 20:22:21,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4951, 'learning_rate': 7.5e-06, 'epoch': 0.28} + 1%|█ | 250/17840 [24:25<15:13:49, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:26,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:26,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 251/17840 [24:32<21:53:41, 4.48s/it]g-point operations will not be computed-15 20:22:26,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 251/17840 [24:32<21:53:41, 4.48s/it]g-point operations will not be computed-15 20:22:26,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 251/17840 [24:32<21:53:41, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 251/17840 [24:32<21:53:41, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:37,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [24:40<25:57:56, 5.31s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [24:40<25:57:56, 5.31s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:43,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:43,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:47<28:41:45, 5.87s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:47<28:41:45, 5.87s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0787, 'learning_rate': 7.59e-06, 'epoch': 0.28} + 1%|█ | 253/17840 [24:47<28:41:45, 5.87s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:47<28:41:45, 5.87s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [24:54<30:34:25, 6.26s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [24:54<30:34:25, 6.26s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1609, 'learning_rate': 7.62e-06, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:22:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [25:01<31:51:24, 6.52s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [25:01<31:51:24, 6.52s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [25:01<31:51:24, 6.52s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [25:01<31:51:24, 6.52s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [25:01<31:51:24, 6.52s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [25:08<32:38:09, 6.68s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:15<33:11:34, 6.80s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:15<33:11:34, 6.80s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:15<33:11:34, 6.80s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:15<33:11:34, 6.80s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:15<33:11:34, 6.80s/it]g-point operations will not be computed-15 20:22:34,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [25:22<33:32:30, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [25:22<33:32:30, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [25:22<33:32:30, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [25:22<33:32:30, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [25:29<33:34:40, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [25:29<33:34:40, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:34,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:36<33:37:36, 6.89s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:36<33:37:36, 6.89s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.9764, 'learning_rate': 7.8e-06, 'epoch': 0.29} + 1%|█ | 260/17840 [25:36<33:37:36, 6.89s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:36<33:37:36, 6.89s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:36<33:37:36, 6.89s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 261/17840 [25:43<33:34:06, 6.87s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:46,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:46,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:46,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [25:50<33:25:53, 6.85s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [25:50<33:25:53, 6.85s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [25:50<33:25:53, 6.85s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [25:50<33:25:53, 6.85s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:23:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0011, 'learning_rate': 7.92e-06, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [26:10<33:01:12, 6.76s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [26:10<33:01:12, 6.76s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:14,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [26:17<33:05:22, 6.78s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [26:17<33:05:22, 6.78s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.9807, 'learning_rate': 7.98e-06, 'epoch': 0.3} + 1%|█▏ | 266/17840 [26:17<33:05:22, 6.78s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [26:17<33:05:22, 6.78s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [26:17<33:05:22, 6.78s/it]g-point operations will not be computed-15 20:23:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:23<32:50:35, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:23<32:50:35, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:23<32:50:35, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:23<32:50:35, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [26:30<32:47:21, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:33,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:33,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:33,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [26:37<32:38:24, 6.69s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [26:37<32:38:24, 6.69s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:41,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [26:43<32:34:06, 6.67s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [26:43<32:34:06, 6.67s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8994, 'learning_rate': 8.1e-06, 'epoch': 0.3} + 2%|█▏ | 270/17840 [26:43<32:34:06, 6.67s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:49,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:49,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.84, 'learning_rate': 8.13e-06, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:49,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:49,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:49,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [26:56<32:19:25, 6.62s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:59,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:59,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:24:59,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 273/17840 [27:03<32:06:25, 6.58s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 273/17840 [27:03<32:06:25, 6.58s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:07,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [27:09<32:00:41, 6.56s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [27:09<32:00:41, 6.56s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7049, 'learning_rate': 8.220000000000001e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:13,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:13,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [27:17<33:44:50, 6.92s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [27:17<33:44:50, 6.92s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:21,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 276/17840 [27:24<33:03:04, 6.77s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 276/17840 [27:24<33:03:04, 6.77s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7744, 'learning_rate': 8.28e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:27,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [27:30<32:13:34, 6.61s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [27:30<32:13:34, 6.61s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6969, 'learning_rate': 8.310000000000002e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:34,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [27:36<31:34:33, 6.47s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [27:36<31:34:33, 6.47s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8058, 'learning_rate': 8.340000000000001e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [27:42<31:08:34, 6.38s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [27:42<31:08:34, 6.38s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7993, 'learning_rate': 8.370000000000001e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:46,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [27:48<30:44:36, 6.30s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [27:48<30:44:36, 6.30s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:51,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:51,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [27:54<30:30:06, 6.25s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [27:54<30:30:06, 6.25s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6926, 'learning_rate': 8.43e-06, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-15 20:25:58,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [28:00<30:00:55, 6.15s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [28:00<30:00:55, 6.15s/it]g-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:03,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:03,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:24:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 283/17840 [28:06<29:38:25, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:07,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 283/17840 [28:06<29:38:25, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:07,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6298, 'learning_rate': 8.49e-06, 'epoch': 0.32} + 2%|█▏ | 283/17840 [28:06<29:38:25, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:07,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 283/17840 [28:06<29:38:25, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:07,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [28:12<29:01:50, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [28:12<29:01:50, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:17,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:17,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7349, 'learning_rate': 8.55e-06, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:21,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 286/17840 [28:23<28:01:52, 5.75s/it]g-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 286/17840 [28:23<28:01:52, 5.75s/it]g-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:25,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:25,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:25,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:13,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [28:28<27:25:44, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [28:28<27:25:44, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:33,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:33,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.701, 'learning_rate': 8.64e-06, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:37,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 289/17840 [28:39<26:12:32, 5.38s/it]g-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 289/17840 [28:39<26:12:32, 5.38s/it]g-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:40,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:43,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:43,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:45,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:47,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:47,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7837, 'learning_rate': 8.73e-06, 'epoch': 0.33} +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:51,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:51,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 292/17840 [28:53<23:31:46, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:53,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:55,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:53,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:26:55,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:26:53,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [28:57<22:30:10, 4.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:26:57,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [29:00<21:17:43, 4.37s/it]g-point operations will not be computed-15 20:26:57,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [29:00<21:17:43, 4.37s/it]g-point operations will not be computed-15 20:26:57,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [29:00<21:17:43, 4.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:01,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 295/17840 [29:04<20:06:36, 4.13s/it]g-point operations will not be computed-15 20:27:01,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 295/17840 [29:04<20:06:36, 4.13s/it]g-point operations will not be computed-15 20:27:01,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:06,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:04,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 296/17840 [29:07<18:44:20, 3.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:07,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 296/17840 [29:07<18:44:20, 3.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:07,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 297/17840 [29:10<17:14:55, 3.54s/it]g-point operations will not be computed-15 20:27:07,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 297/17840 [29:10<17:14:55, 3.54s/it]g-point operations will not be computed-15 20:27:07,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 298/17840 [29:13<15:49:39, 3.25s/it]g-point operations will not be computed-15 20:27:10,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 298/17840 [29:13<15:49:39, 3.25s/it]g-point operations will not be computed-15 20:27:10,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:13,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:12,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:16,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:15,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:16,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:15,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:18<14:41:00, 3.01s/it]g-point operations will not be computed-15 20:27:15,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:18<14:41:00, 3.01s/it]g-point operations will not be computed-15 20:27:15,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:18<14:41:00, 3.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:19,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:18<14:41:00, 3.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:19,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:23,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:19,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:23,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:19,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:26<21:22:03, 4.39s/it]g-point operations will not be computed-15 20:27:19,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:26<21:22:03, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:27,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:26<21:22:03, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:27,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:33<25:29:57, 5.23s/it]g-point operations will not be computed-15 20:27:27,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:33<25:29:57, 5.23s/it]g-point operations will not be computed-15 20:27:27,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:33<25:29:57, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:33<25:29:57, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:33<25:29:57, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:33<25:29:57, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [29:40<28:27:21, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [29:40<28:27:21, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:45,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:47<30:22:22, 6.24s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:47<30:22:22, 6.24s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.842, 'learning_rate': 9.12e-06, 'epoch': 0.34} + 2%|█▎ | 304/17840 [29:47<30:22:22, 6.24s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:47<30:22:22, 6.24s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:47<30:22:22, 6.24s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [29:54<31:40:12, 6.50s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [29:54<31:40:12, 6.50s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:27:59,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [30:01<32:24:44, 6.65s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [30:01<32:24:44, 6.65s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6835, 'learning_rate': 9.18e-06, 'epoch': 0.34} + 2%|█▎ | 306/17840 [30:01<32:24:44, 6.65s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [30:01<32:24:44, 6.65s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [30:01<32:24:44, 6.65s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [30:08<32:54:58, 6.76s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:11,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:11,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:11,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:15<33:10:27, 6.81s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:15<33:10:27, 6.81s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:15<33:10:27, 6.81s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:15<33:10:27, 6.81s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:15<33:10:27, 6.81s/it]g-point operations will not be computed-15 20:27:34,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:22<33:20:55, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:22<33:20:55, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:22<33:20:55, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:22<33:20:55, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [30:29<33:25:01, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [30:29<33:25:01, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:33,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [30:36<33:15:36, 6.83s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [30:36<33:15:36, 6.83s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6919, 'learning_rate': 9.33e-06, 'epoch': 0.35} + 2%|█▎ | 311/17840 [30:36<33:15:36, 6.83s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:42,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:42,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6879, 'learning_rate': 9.36e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:42,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:42,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:42,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [30:49<32:58:26, 6.77s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:52,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:52,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:28:52,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [30:56<32:48:47, 6.74s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [30:56<32:48:47, 6.74s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:00,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [31:03<32:48:07, 6.74s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [31:03<32:48:07, 6.74s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5183, 'learning_rate': 9.450000000000001e-06, 'epoch': 0.35} + 2%|█▎ | 315/17840 [31:03<32:48:07, 6.74s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:09,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:09,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6105, 'learning_rate': 9.48e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:09,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:09,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:09,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 317/17840 [31:16<32:24:05, 6.66s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:18,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:18,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:18,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [31:22<32:09:30, 6.61s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:25,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:25,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [31:29<32:03:05, 6.59s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [31:29<32:03:05, 6.59s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4527, 'learning_rate': 9.57e-06, 'epoch': 0.36} + 2%|█▎ | 319/17840 [31:29<32:03:05, 6.59s/it]g-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:35,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:35,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6032, 'learning_rate': 9.600000000000001e-06, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:35,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:41,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:41,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5337, 'learning_rate': 9.630000000000001e-06, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:41,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:41,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:41,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:28:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [31:48<31:33:32, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [31:48<31:33:32, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [31:48<31:33:32, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [31:48<31:33:32, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 323/17840 [31:55<31:28:03, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:57,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:57,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:29:57,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [32:01<31:19:25, 6.44s/it]g-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:03,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:03,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:03,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:29:49,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [32:09<33:11:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [32:09<33:11:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [32:09<33:11:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [32:09<33:11:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 326/17840 [32:15<32:30:52, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:18,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:18,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:18,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:10,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [32:21<31:59:53, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:22,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [32:21<31:59:53, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:22,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [32:21<31:59:53, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:22,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [32:21<31:59:53, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:22,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [32:28<31:18:01, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [32:28<31:18:01, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [32:28<31:18:01, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [32:28<31:18:01, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [32:34<30:53:42, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:36,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:36,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:36,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 330/17840 [32:40<30:25:11, 6.25s/it]g-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:42,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:42,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:42,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [32:46<30:04:25, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [32:46<30:04:25, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:51,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:51,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2791, 'learning_rate': 9.960000000000001e-06, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:51,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:57,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:30:57,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4651, 'learning_rate': 9.990000000000001e-06, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:01,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 334/17840 [33:03<28:49:41, 5.93s/it]g-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 334/17840 [33:03<28:49:41, 5.93s/it]g-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4506, 'learning_rate': 1.002e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:07,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 335/17840 [33:09<28:21:10, 5.83s/it]g-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 335/17840 [33:09<28:21:10, 5.83s/it]g-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:11,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:11,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:30:46,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [33:14<28:00:45, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [33:14<28:00:45, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3507, 'learning_rate': 1.008e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:19,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:19,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.317, 'learning_rate': 1.0110000000000001e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:23,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 338/17840 [33:25<27:04:17, 5.57s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 338/17840 [33:25<27:04:17, 5.57s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:27,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:29,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:29,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4921, 'learning_rate': 1.0170000000000001e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:33,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [33:35<25:36:31, 5.27s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [33:35<25:36:31, 5.27s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:37,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:39,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:39,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:41,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:43,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:43,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:46,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:48,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:48,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:50,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:52,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:52,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:53,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:55,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:55,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:31:57,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:00,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:00,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:01,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:01,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:04,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:04,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:05,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:07,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:07,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:09,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:09,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9771, 'learning_rate': 1.05e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:13,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:13,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:17,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:17,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4278, 'learning_rate': 1.0529999999999999e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:21,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:21,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [34:25<25:46:27, 5.31s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [34:25<25:46:27, 5.31s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:28,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:28,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:28,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [34:32<28:31:37, 5.87s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [34:32<28:31:37, 5.87s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [34:32<28:31:37, 5.87s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [34:32<28:31:37, 5.87s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [34:40<30:23:42, 6.26s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [34:40<30:23:42, 6.26s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4202, 'learning_rate': 1.062e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:44,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:32:44,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:47<31:36:54, 6.51s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:47<31:36:54, 6.51s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:47<31:36:54, 6.51s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:47<31:36:54, 6.51s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:47<31:36:54, 6.51s/it]g-point operations will not be computed-15 20:31:15,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:54<32:20:24, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:54<32:20:24, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:54<32:20:24, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:54<32:20:24, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [35:01<32:52:38, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [35:01<32:52:38, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:05,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:08<33:07:14, 6.82s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:08<33:07:14, 6.82s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3198, 'learning_rate': 1.074e-05, 'epoch': 0.4} + 2%|█▌ | 358/17840 [35:08<33:07:14, 6.82s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:08<33:07:14, 6.82s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:08<33:07:14, 6.82s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [35:15<33:16:19, 6.85s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [35:15<33:16:19, 6.85s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:19,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:19,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:21<33:12:57, 6.84s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:21<33:12:57, 6.84s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:21<33:12:57, 6.84s/it]g-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:27,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:27,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2784, 'learning_rate': 1.083e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:27,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:27,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:27,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:32:55,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:35<33:05:01, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:35<33:05:01, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:35<33:05:01, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:35<33:05:01, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 363/17840 [35:42<32:58:05, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 363/17840 [35:42<32:58:05, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:33:46,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [35:48<32:52:53, 6.77s/it]g-point operations will not be computed-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [35:48<32:52:53, 6.77s/it]g-point operations will not be computed-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.324, 'learning_rate': 1.092e-05, 'epoch': 0.41} + 2%|█▌ | 364/17840 [35:48<32:52:53, 6.77s/it]g-point operations will not be computed-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [35:48<32:52:53, 6.77s/it]g-point operations will not be computed-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [35:48<32:52:53, 6.77s/it]g-point operations will not be computed-15 20:33:36,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [35:55<32:42:20, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [35:55<32:42:20, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [35:55<32:42:20, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [35:55<32:42:20, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [36:02<32:38:02, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [36:02<32:38:02, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:06,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [36:09<32:34:17, 6.71s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [36:09<32:34:17, 6.71s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2495, 'learning_rate': 1.101e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:13,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [36:15<32:24:57, 6.68s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [36:15<32:24:57, 6.68s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2139, 'learning_rate': 1.104e-05, 'epoch': 0.41} + 2%|█▌ | 368/17840 [36:15<32:24:57, 6.68s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [36:15<32:24:57, 6.68s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [36:15<32:24:57, 6.68s/it]g-point operations will not be computed-15 20:33:56,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [36:22<32:19:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [36:22<32:19:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [36:22<32:19:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [36:22<32:19:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [36:28<31:59:12, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [36:35<31:50:45, 6.56s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [36:35<31:50:45, 6.56s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:39,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [36:41<31:40:40, 6.53s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [36:41<31:40:40, 6.53s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.399, 'learning_rate': 1.116e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:45,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [36:48<31:30:05, 6.49s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [36:48<31:30:05, 6.49s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2489, 'learning_rate': 1.119e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:51,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [36:54<31:14:31, 6.44s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [36:54<31:14:31, 6.44s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3441, 'learning_rate': 1.1220000000000001e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:34:58,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [37:01<32:46:59, 6.76s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [37:01<32:46:59, 6.76s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1515, 'learning_rate': 1.125e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:05,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [37:08<32:22:23, 6.67s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [37:08<32:22:23, 6.67s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2581, 'learning_rate': 1.128e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:12,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [37:14<31:38:03, 6.52s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [37:14<31:38:03, 6.52s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1427, 'learning_rate': 1.131e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:18,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [37:20<31:07:32, 6.42s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [37:20<31:07:32, 6.42s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1896, 'learning_rate': 1.134e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:24,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 379/17840 [37:26<30:41:37, 6.33s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 379/17840 [37:26<30:41:37, 6.33s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:29,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:29,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [37:32<30:15:57, 6.24s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [37:32<30:15:57, 6.24s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2508, 'learning_rate': 1.1400000000000001e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:36,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [37:38<29:55:23, 6.17s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [37:38<29:55:23, 6.17s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:41,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:41,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [37:44<29:34:22, 6.10s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [37:44<29:34:22, 6.10s/it]g-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:46,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:46,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:46,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:34:23,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [37:50<29:13:51, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [37:50<29:13:51, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:55,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:55,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2551, 'learning_rate': 1.152e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-15 20:35:55,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:01,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:01,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1458, 'learning_rate': 1.1550000000000001e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:05,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 386/17840 [38:07<27:56:46, 5.76s/it]g-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 386/17840 [38:07<27:56:46, 5.76s/it]g-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:09,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:12,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:12,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:12,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:16,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 388/17840 [38:18<26:55:09, 5.55s/it]g-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 388/17840 [38:18<26:55:09, 5.55s/it]g-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:20,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:20,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:35:51,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [38:23<26:16:07, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [38:23<26:16:07, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1289, 'learning_rate': 1.167e-05, 'epoch': 0.44} +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:27,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:27,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:29,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:32,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:32,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:34,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:36,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:36,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:36,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:40,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:40,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:23,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 393/17840 [38:41<23:06:07, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:42,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:44,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:42,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:44,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:42,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 394/17840 [38:46<22:05:57, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:46,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:48,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:46,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:36:48,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:36:46,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 395/17840 [38:49<20:58:35, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:49,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [38:53<19:38:00, 4.05s/it]g-point operations will not be computed-15 20:36:49,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [38:53<19:38:00, 4.05s/it]g-point operations will not be computed-15 20:36:49,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [38:53<19:38:00, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:53,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 397/17840 [38:56<18:11:01, 3.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:56,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 397/17840 [38:56<18:11:01, 3.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:56,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 398/17840 [38:58<16:28:11, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:58,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 398/17840 [38:58<16:28:11, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:36:58,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9958, 'learning_rate': 1.1940000000000001e-05, 'epoch': 0.45} + 2%|█▋ | 399/17840 [39:01<14:56:48, 3.09s/it]g-point operations will not be computed-15 20:36:58,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:02,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:01,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:02,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:01,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [39:04<15:18:02, 3.16s/it]g-point operations will not be computed-15 20:37:01,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [39:04<15:18:02, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:05,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [39:04<15:18:02, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:05,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:09,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:05,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:09,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:05,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [39:12<21:51:04, 4.51s/it]g-point operations will not be computed-15 20:37:05,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [39:12<21:51:04, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:16,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:16,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:19<26:00:19, 5.37s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:19<26:00:19, 5.37s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:19<26:00:19, 5.37s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:19<26:00:19, 5.37s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:19<26:00:19, 5.37s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:26<28:50:18, 5.95s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:26<28:50:18, 5.95s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:26<28:50:18, 5.95s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:26<28:50:18, 5.95s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:26<28:50:18, 5.95s/it]g-point operations will not be computed-15 20:37:13,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [39:34<30:38:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [39:34<30:38:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [39:34<30:38:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [39:34<30:38:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [39:41<31:51:38, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [39:41<31:51:38, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [39:41<31:51:38, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:47,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:47,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2314, 'learning_rate': 1.2180000000000002e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:47,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:47,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:47,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [39:55<33:06:52, 6.84s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [39:55<33:06:52, 6.84s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:37:59,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [40:02<33:30:34, 6.92s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [40:02<33:30:34, 6.92s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1361, 'learning_rate': 1.224e-05, 'epoch': 0.46} + 2%|█▋ | 408/17840 [40:02<33:30:34, 6.92s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [40:02<33:30:34, 6.92s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [40:02<33:30:34, 6.92s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [40:09<33:34:00, 6.93s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:12,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:12,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:12,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [40:16<33:32:54, 6.93s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [40:16<33:32:54, 6.93s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [40:16<33:32:54, 6.93s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:22,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:22,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1668, 'learning_rate': 1.2329999999999999e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:22,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:22,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:22,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [40:30<33:23:22, 6.90s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [40:30<33:23:22, 6.90s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:34,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [40:36<33:14:30, 6.87s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [40:36<33:14:30, 6.87s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0757, 'learning_rate': 1.239e-05, 'epoch': 0.46} + 2%|█▊ | 413/17840 [40:36<33:14:30, 6.87s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:42,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:42,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0394, 'learning_rate': 1.242e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:42,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:42,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:42,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [40:50<33:01:56, 6.82s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:53,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:38:53,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [40:57<32:52:58, 6.79s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [40:57<32:52:58, 6.79s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1777, 'learning_rate': 1.2479999999999999e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:01,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [41:03<32:42:25, 6.76s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [41:03<32:42:25, 6.76s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0795, 'learning_rate': 1.251e-05, 'epoch': 0.47} + 2%|█▊ | 417/17840 [41:03<32:42:25, 6.76s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1362, 'learning_rate': 1.254e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:09,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [41:17<32:22:52, 6.69s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [41:17<32:22:52, 6.69s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:19,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:19,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [41:23<32:14:51, 6.66s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [41:23<32:14:51, 6.66s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1196, 'learning_rate': 1.26e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:27,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [41:30<32:07:36, 6.64s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [41:30<32:07:36, 6.64s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1635, 'learning_rate': 1.263e-05, 'epoch': 0.47} + 2%|█▊ | 421/17840 [41:30<32:07:36, 6.64s/it]g-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:36,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:36,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1899, 'learning_rate': 1.2659999999999999e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:36,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:42,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:42,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1576, 'learning_rate': 1.269e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:42,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.125, 'learning_rate': 1.272e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1386, 'learning_rate': 1.275e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-15 20:39:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:03,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:03,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:06,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:06,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:37:35,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [42:10<31:57:14, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:10,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [42:10<31:57:14, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:10,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0452, 'learning_rate': 1.281e-05, 'epoch': 0.48} + 2%|█▊ | 427/17840 [42:10<31:57:14, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:10,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [42:10<31:57:14, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:10,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [42:16<31:23:07, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:17,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [42:16<31:23:07, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:17,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [42:16<31:23:07, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:17,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [42:16<31:23:07, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:17,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [42:22<30:52:53, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:23,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [42:22<30:52:53, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:23,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [42:22<30:52:53, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:23,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [42:28<30:28:17, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:29,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [42:28<30:28:17, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:29,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.116, 'learning_rate': 1.29e-05, 'epoch': 0.48} + 2%|█▊ | 430/17840 [42:28<30:28:17, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:29,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [42:28<30:28:17, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:29,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [42:34<30:14:03, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:35,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [42:34<30:14:03, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:35,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [42:34<30:14:03, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:35,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [42:34<30:14:03, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:35,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [42:40<30:01:57, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [42:40<30:01:57, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [42:40<30:01:57, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [42:40<30:01:57, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [42:46<29:47:26, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [42:46<29:47:26, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0518, 'learning_rate': 1.302e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:57,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:40:57,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0114, 'learning_rate': 1.305e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:02,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:02,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 436/17840 [43:04<28:25:10, 5.88s/it]g-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 436/17840 [43:04<28:25:10, 5.88s/it]g-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:07,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:07,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 437/17840 [43:09<28:00:43, 5.79s/it]g-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:11,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:14,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:14,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.142, 'learning_rate': 1.314e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:18,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:18,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 439/17840 [43:20<26:57:50, 5.58s/it]g-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:22,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:24,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:24,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0925, 'learning_rate': 1.32e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:28,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:28,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:40:47,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [43:30<25:21:23, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [43:30<25:21:23, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [43:30<25:21:23, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:34,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:36,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:38,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:38,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:40,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:42,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:42,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:46,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:48,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:48,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:49,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:52,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:52,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:56,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:56,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:41:58,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:01,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:01,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5794, 'learning_rate': 1.3500000000000001e-05, 'epoch': 0.5} +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:04,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:04,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:08,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:08,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2045, 'learning_rate': 1.3530000000000001e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:12,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:12,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:12,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [44:16<25:41:34, 5.32s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:19,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:19,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [44:23<28:26:52, 5.89s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [44:23<28:26:52, 5.89s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3452, 'learning_rate': 1.359e-05, 'epoch': 0.51} + 3%|█▉ | 453/17840 [44:23<28:26:52, 5.89s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [44:23<28:26:52, 5.89s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [44:23<28:26:52, 5.89s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [44:30<30:08:45, 6.24s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [44:37<31:09:04, 6.45s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [44:37<31:09:04, 6.45s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2512, 'learning_rate': 1.3650000000000001e-05, 'epoch': 0.51} + 3%|█▉ | 455/17840 [44:37<31:09:04, 6.45s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.241, 'learning_rate': 1.3680000000000001e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [44:51<32:28:01, 6.72s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [44:51<32:28:01, 6.72s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:42:56,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [44:58<32:48:46, 6.80s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [44:58<32:48:46, 6.80s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1163, 'learning_rate': 1.374e-05, 'epoch': 0.51} + 3%|█▉ | 458/17840 [44:58<32:48:46, 6.80s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [44:58<32:48:46, 6.80s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [44:58<32:48:46, 6.80s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [45:05<33:04:05, 6.85s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:08,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:08,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [45:12<33:01:17, 6.84s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [45:12<33:01:17, 6.84s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1374, 'learning_rate': 1.3800000000000002e-05, 'epoch': 0.52} + 3%|█▉ | 460/17840 [45:12<33:01:17, 6.84s/it]g-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:18,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:18,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9847, 'learning_rate': 1.3830000000000001e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:18,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:18,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:18,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:41:30,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 462/17840 [45:26<32:53:45, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 462/17840 [45:26<32:53:45, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 462/17840 [45:26<32:53:45, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [45:32<32:46:46, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [45:32<32:46:46, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9789, 'learning_rate': 1.389e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:37,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [45:39<32:31:43, 6.74s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [45:39<32:31:43, 6.74s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9773, 'learning_rate': 1.392e-05, 'epoch': 0.52} + 3%|█▉ | 464/17840 [45:39<32:31:43, 6.74s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:45,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:45,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0705, 'learning_rate': 1.395e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:45,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:45,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:45,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [45:52<32:19:23, 6.70s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:55,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:43:55,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [45:59<32:11:04, 6.67s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [45:59<32:11:04, 6.67s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0037, 'learning_rate': 1.4010000000000001e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:03,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [46:06<32:03:46, 6.64s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [46:06<32:03:46, 6.64s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0776, 'learning_rate': 1.4040000000000001e-05, 'epoch': 0.52} + 3%|█▉ | 468/17840 [46:06<32:03:46, 6.64s/it]g-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:11,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:11,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9931, 'learning_rate': 1.4069999999999999e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:11,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:11,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:11,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:43:27,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [46:19<31:58:22, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [46:19<31:58:22, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [46:19<31:58:22, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [46:19<31:58:22, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [46:25<31:47:42, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:28,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:28,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [46:32<31:40:16, 6.56s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [46:32<31:40:16, 6.56s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:34,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:34,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [46:38<31:30:44, 6.53s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [46:38<31:30:44, 6.53s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0239, 'learning_rate': 1.419e-05, 'epoch': 0.53} + 3%|██ | 473/17840 [46:38<31:30:44, 6.53s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:44,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:44,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9477, 'learning_rate': 1.422e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:44,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:44,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [46:52<32:43:13, 6.78s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [46:52<32:43:13, 6.78s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0898, 'learning_rate': 1.4249999999999999e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-15 20:44:56,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [46:58<32:05:41, 6.65s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [46:58<32:05:41, 6.65s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:01,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:01,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [47:05<31:26:58, 6.52s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [47:05<31:26:58, 6.52s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1733, 'learning_rate': 1.431e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:08,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [47:11<30:57:48, 6.42s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [47:11<30:57:48, 6.42s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:13,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:13,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [47:17<30:25:21, 6.31s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [47:17<30:25:21, 6.31s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9384, 'learning_rate': 1.437e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:21,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [47:23<30:08:52, 6.25s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [47:23<30:08:52, 6.25s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9788, 'learning_rate': 1.44e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:27,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [47:29<29:44:24, 6.17s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [47:29<29:44:24, 6.17s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9565, 'learning_rate': 1.4429999999999999e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:33,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [47:35<29:26:06, 6.10s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [47:35<29:26:06, 6.10s/it]g-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:37,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:37,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:44:20,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [47:41<28:58:39, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [47:41<28:58:39, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0223, 'learning_rate': 1.449e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:46,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:46,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0351, 'learning_rate': 1.452e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:46,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:51,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:51,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.052, 'learning_rate': 1.455e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-15 20:45:56,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [47:58<27:49:08, 5.77s/it]g-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [47:58<27:49:08, 5.77s/it]g-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:00,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:00,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:00,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:45:41,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 487/17840 [48:03<27:22:04, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 487/17840 [48:03<27:22:04, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 487/17840 [48:03<27:22:04, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:08,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:10,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:10,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:10,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:04,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 489/17840 [48:14<26:08:36, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:16,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:16,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 490/17840 [48:18<25:24:00, 5.27s/it]g-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:20,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:22,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:22,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9478, 'learning_rate': 1.473e-05, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:26,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:26,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:14,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 492/17840 [48:28<23:30:39, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:30,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:30,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 493/17840 [48:32<22:19:40, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:32,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 493/17840 [48:32<22:19:40, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:32,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [48:35<20:57:28, 4.35s/it]g-point operations will not be computed-15 20:46:32,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [48:35<20:57:28, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:35,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [48:35<20:57:28, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:35,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 495/17840 [48:39<19:34:00, 4.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:39,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:40,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:39,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:40,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:39,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 496/17840 [48:42<18:12:44, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:42,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 496/17840 [48:42<18:12:44, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:42,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 497/17840 [48:45<16:54:22, 3.51s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:45,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 497/17840 [48:45<16:54:22, 3.51s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:45,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 498/17840 [48:47<15:31:40, 3.22s/it]g-point operations will not be computed-15 20:46:45,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 498/17840 [48:47<15:31:40, 3.22s/it]g-point operations will not be computed-15 20:46:45,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 499/17840 [48:50<14:20:03, 2.98s/it]g-point operations will not be computed-15 20:46:47,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:50,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:49,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:50,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:49,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:53<14:58:18, 3.11s/it]g-point operations will not be computed-15 20:46:49,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:53<14:58:18, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:53<14:58:18, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:46:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:58,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:46:58,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:46:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [49:01<21:23:02, 4.44s/it]g-point operations will not be computed-15 20:46:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [49:01<21:23:02, 4.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:02,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [49:01<21:23:02, 4.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:02,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [49:08<25:40:06, 5.33s/it]g-point operations will not be computed-15 20:47:02,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [49:08<25:40:06, 5.33s/it]g-point operations will not be computed-15 20:47:02,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [49:08<25:40:06, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [49:08<25:40:06, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [49:08<25:40:06, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [49:08<25:40:06, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 503/17840 [49:15<28:28:52, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 503/17840 [49:15<28:28:52, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 503/17840 [49:15<28:28:52, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:22,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:22,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2604, 'learning_rate': 1.5120000000000001e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:22,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:22,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:22,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [49:29<31:22:45, 6.52s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:32,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:32,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:36<32:00:17, 6.65s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:36<32:00:17, 6.65s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1748, 'learning_rate': 1.518e-05, 'epoch': 0.57} + 3%|██▏ | 506/17840 [49:36<32:00:17, 6.65s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:36<32:00:17, 6.65s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:36<32:00:17, 6.65s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [49:44<32:40:27, 6.79s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:46,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:47:46,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [49:51<33:00:47, 6.86s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [49:51<33:00:47, 6.86s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0013, 'learning_rate': 1.524e-05, 'epoch': 0.57} + 3%|██▏ | 508/17840 [49:51<33:00:47, 6.86s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [49:51<33:00:47, 6.86s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [49:51<33:00:47, 6.86s/it]g-point operations will not be computed-15 20:47:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:58<33:09:22, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:58<33:09:22, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:58<33:09:22, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 510/17840 [50:05<33:19:22, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 510/17840 [50:05<33:19:22, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0265, 'learning_rate': 1.53e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-15 20:48:09,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [50:11<33:16:08, 6.91s/it]g-point operations will not be computed-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [50:11<33:16:08, 6.91s/it]g-point operations will not be computed-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9898, 'learning_rate': 1.533e-05, 'epoch': 0.57} + 3%|██▏ | 511/17840 [50:11<33:16:08, 6.91s/it]g-point operations will not be computed-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [50:11<33:16:08, 6.91s/it]g-point operations will not be computed-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [50:11<33:16:08, 6.91s/it]g-point operations will not be computed-15 20:47:58,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [50:18<33:09:43, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [50:18<33:09:43, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [50:18<33:09:43, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [50:25<32:57:13, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [50:25<32:57:13, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1465, 'learning_rate': 1.539e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-15 20:48:29,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [50:32<32:51:46, 6.83s/it]g-point operations will not be computed-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [50:32<32:51:46, 6.83s/it]g-point operations will not be computed-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0691, 'learning_rate': 1.542e-05, 'epoch': 0.58} + 3%|██▏ | 514/17840 [50:32<32:51:46, 6.83s/it]g-point operations will not be computed-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [50:32<32:51:46, 6.83s/it]g-point operations will not be computed-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [50:32<32:51:46, 6.83s/it]g-point operations will not be computed-15 20:48:19,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [50:39<32:43:30, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [50:39<32:43:30, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [50:39<32:43:30, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [50:45<32:37:51, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [50:45<32:37:51, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:48:48,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:48:48,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [50:52<32:34:20, 6.77s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [50:52<32:34:20, 6.77s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0741, 'learning_rate': 1.5510000000000002e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-15 20:48:56,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [50:59<32:23:18, 6.73s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [50:59<32:23:18, 6.73s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9386, 'learning_rate': 1.554e-05, 'epoch': 0.58} + 3%|██▏ | 518/17840 [50:59<32:23:18, 6.73s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:04,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:04,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:04,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1078, 'learning_rate': 1.5570000000000002e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:04,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [51:12<31:58:59, 6.65s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [51:12<31:58:59, 6.65s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [51:18<31:47:00, 6.61s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:21,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:21,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:21,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [51:25<31:30:15, 6.55s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [51:25<31:30:15, 6.55s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:29,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:29,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [51:31<31:23:39, 6.53s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [51:31<31:23:39, 6.53s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:35,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:38<31:13:37, 6.49s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:38<31:13:37, 6.49s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9398, 'learning_rate': 1.5720000000000002e-05, 'epoch': 0.59} + 3%|██▏ | 524/17840 [51:38<31:13:37, 6.49s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:38<31:13:37, 6.49s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:38<31:13:37, 6.49s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [51:45<32:54:49, 6.84s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [51:45<32:54:49, 6.84s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:49,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:49,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [51:52<32:10:58, 6.69s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [51:52<32:10:58, 6.69s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [51:52<32:10:58, 6.69s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:57,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:57,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9909, 'learning_rate': 1.5810000000000003e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-15 20:49:57,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:03,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:03,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0464, 'learning_rate': 1.584e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:03,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:10,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:10,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0722, 'learning_rate': 1.5870000000000002e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:10,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0954, 'learning_rate': 1.59e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:22,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:22,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.962, 'learning_rate': 1.593e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:26,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 532/17840 [52:29<29:38:53, 6.17s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 532/17840 [52:29<29:38:53, 6.17s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9215, 'learning_rate': 1.596e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:32,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:32,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 533/17840 [52:34<29:13:43, 6.08s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:37,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:37,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:37,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 534/17840 [52:40<28:45:19, 5.98s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:42,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:42,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:42,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 535/17840 [52:46<28:20:09, 5.89s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:48,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:51,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:51,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0719, 'learning_rate': 1.6080000000000002e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:55,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [52:57<27:29:40, 5.72s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [52:57<27:29:40, 5.72s/it]g-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:59,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:59,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:50:59,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:48:39,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [53:02<26:54:01, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [53:02<26:54:01, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:07,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:07,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:09,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:09,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:09,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 540/17840 [53:12<25:12:45, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:13,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:15,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:13,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:15,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:13,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 541/17840 [53:17<24:05:20, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:17,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:19,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:17,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:19,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:17,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 542/17840 [53:21<22:56:03, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:21,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:23,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:21,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:23,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:21,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [53:25<21:44:13, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:25,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:27,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:25,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:27,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:25,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 544/17840 [53:28<20:20:53, 4.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:28,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 545/17840 [53:32<18:50:07, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:32,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 545/17840 [53:32<18:50:07, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:32,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:33,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:32,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:33,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:32,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 546/17840 [53:35<17:24:51, 3.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:34,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 547/17840 [53:37<16:10:34, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:37,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 547/17840 [53:37<16:10:34, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:37,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 548/17840 [53:40<15:01:51, 3.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:40,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 548/17840 [53:40<15:01:51, 3.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:40,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 549/17840 [53:42<13:54:23, 2.90s/it]g-point operations will not be computed-15 20:51:40,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 549/17840 [53:42<13:54:23, 2.90s/it]g-point operations will not be computed-15 20:51:40,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:43,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:42,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [53:46<14:23:27, 3.00s/it]g-point operations will not be computed-15 20:51:42,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [53:46<14:23:27, 3.00s/it]g-point operations will not be computed-15 20:51:42,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [53:46<14:23:27, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:47,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [53:46<14:23:27, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:47,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:50,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:47,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:50,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:47,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [53:53<20:55:15, 4.36s/it]g-point operations will not be computed-15 20:51:47,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [53:53<20:55:15, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:51:54,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:51:58,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:51:54,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [54:00<25:04:29, 5.22s/it]g-point operations will not be computed-15 20:51:54,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [54:00<25:04:29, 5.22s/it]g-point operations will not be computed-15 20:51:54,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [54:00<25:04:29, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [54:00<25:04:29, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [54:00<25:04:29, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [54:00<25:04:29, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [54:07<27:58:06, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [54:07<27:58:06, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [54:07<27:58:06, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:14,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:14,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1877, 'learning_rate': 1.6620000000000004e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:14,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:14,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:14,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [54:22<31:00:13, 6.46s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:24,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:24,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:29<31:50:42, 6.63s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:29<31:50:42, 6.63s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0755, 'learning_rate': 1.6680000000000003e-05, 'epoch': 0.62} + 3%|██▎ | 556/17840 [54:29<31:50:42, 6.63s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:29<31:50:42, 6.63s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:29<31:50:42, 6.63s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [54:35<32:07:46, 6.69s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:38,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:38,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [54:42<32:28:31, 6.76s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [54:42<32:28:31, 6.76s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0437, 'learning_rate': 1.6740000000000002e-05, 'epoch': 0.63} + 3%|██▍ | 558/17840 [54:42<32:28:31, 6.76s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:48,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:48,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9926, 'learning_rate': 1.677e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:48,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:48,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 560/17840 [54:56<32:55:49, 6.86s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 560/17840 [54:56<32:55:49, 6.86s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:59,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:52:59,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [55:03<32:58:54, 6.87s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [55:03<32:58:54, 6.87s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0338, 'learning_rate': 1.6830000000000003e-05, 'epoch': 0.63} + 3%|██▍ | 561/17840 [55:03<32:58:54, 6.87s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9071, 'learning_rate': 1.686e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [55:17<32:36:13, 6.79s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [55:17<32:36:13, 6.79s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:19,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:19,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [55:23<32:27:40, 6.76s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [55:23<32:27:40, 6.76s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9716, 'learning_rate': 1.6919999999999997e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:28,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [55:30<32:19:00, 6.73s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [55:30<32:19:00, 6.73s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1159, 'learning_rate': 1.695e-05, 'epoch': 0.63} + 3%|██▍ | 565/17840 [55:30<32:19:00, 6.73s/it]g-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:36,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:36,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8501, 'learning_rate': 1.698e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:36,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:36,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:36,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:52:01,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [55:43<31:55:28, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [55:43<31:55:28, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [55:43<31:55:28, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [55:43<31:55:28, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [55:50<31:54:46, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:52,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:52,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:53:52,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [55:56<31:41:41, 6.61s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [55:56<31:41:41, 6.61s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:00,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:00,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 570/17840 [56:03<31:33:40, 6.58s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 570/17840 [56:03<31:33:40, 6.58s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:07,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [56:09<31:30:05, 6.57s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [56:09<31:30:05, 6.57s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9117, 'learning_rate': 1.713e-05, 'epoch': 0.64} + 3%|██▍ | 571/17840 [56:09<31:30:05, 6.57s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:15,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:15,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0433, 'learning_rate': 1.716e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:15,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:21,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:21,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9053, 'learning_rate': 1.719e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:21,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:28,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:28,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8068, 'learning_rate': 1.7219999999999998e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:28,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:54:28,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:36<32:33:08, 6.79s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:36<32:33:08, 6.79s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9769, 'learning_rate': 1.725e-05, 'epoch': 0.64} + 3%|██▍ | 575/17840 [56:36<32:33:08, 6.79s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:36<32:33:08, 6.79s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:36<32:33:08, 6.79s/it]g-point operations will not be computed-15 20:53:44,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [56:42<31:54:14, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:43,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [56:42<31:54:14, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:43,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [56:42<31:54:14, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:43,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [56:42<31:54:14, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:43,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [56:49<31:22:54, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:50,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [56:49<31:22:54, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:50,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [56:49<31:22:54, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:50,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [56:49<31:22:54, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:50,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [56:55<30:54:37, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:56,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [56:55<30:54:37, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:56,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [56:55<30:54:37, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:56,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [56:55<30:54:37, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:54:56,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [57:01<30:37:38, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:02,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [57:01<30:37:38, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:02,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [57:01<30:37:38, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:02,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [57:01<30:37:38, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:02,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [57:07<30:29:13, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:08,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [57:07<30:29:13, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:08,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [57:07<30:29:13, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:08,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [57:07<30:29:13, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:08,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [57:14<30:03:47, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [57:14<30:03:47, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:19,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:19,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9448, 'learning_rate': 1.746e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:19,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:25,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:25,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8553, 'learning_rate': 1.749e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:29,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [57:31<28:45:44, 6.00s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [57:31<28:45:44, 6.00s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9643, 'learning_rate': 1.7519999999999998e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:35,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [57:37<28:12:10, 5.88s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [57:37<28:12:10, 5.88s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9874, 'learning_rate': 1.755e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:40,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [57:42<27:50:12, 5.81s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [57:42<27:50:12, 5.81s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:44,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:47,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:47,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9909, 'learning_rate': 1.761e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:51,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [57:53<26:46:21, 5.59s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [57:53<26:46:21, 5.59s/it]g-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:55,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:55,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:55:55,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:14,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 589/17840 [57:58<26:14:20, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:59,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 589/17840 [57:58<26:14:20, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:55:59,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:03,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:59,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:03,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:59,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9174, 'learning_rate': 1.77e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:06,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:59,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:06,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:55:59,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 591/17840 [58:08<25:01:22, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:56:09,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:11,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:09,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 592/17840 [58:13<24:14:14, 5.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 592/17840 [58:13<24:14:14, 5.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.969, 'learning_rate': 1.776e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:17,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:17,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:19,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:21,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:21,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:23,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:24,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:24,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:28,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:28,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:29,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:31,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:31,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:33,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:33,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:35,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:35,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:37,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:39,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:39,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2943, 'learning_rate': 1.8e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:43,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:43,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:46,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:46,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:50,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:50,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:50,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:54,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:54,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:54,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:54,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:56:54,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [59:02<28:04:39, 5.86s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [59:02<28:04:39, 5.86s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:06,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:06,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [59:09<30:00:01, 6.27s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [59:09<30:00:01, 6.27s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [59:09<30:00:01, 6.27s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [59:09<30:00:01, 6.27s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [59:09<30:00:01, 6.27s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [59:16<31:09:26, 6.51s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:19,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:19,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:19,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [59:23<31:58:01, 6.68s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [59:23<31:58:01, 6.68s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [59:23<31:58:01, 6.68s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:29,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:29,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0184, 'learning_rate': 1.821e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:33,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:33,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:33,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [59:37<32:34:34, 6.81s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [59:37<32:34:34, 6.81s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [59:44<32:43:44, 6.84s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [59:44<32:43:44, 6.84s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9952, 'learning_rate': 1.827e-05, 'epoch': 0.68} + 3%|██▌ | 609/17840 [59:44<32:43:44, 6.84s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:50,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:50,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9445, 'learning_rate': 1.83e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:53,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:53,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:57:53,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [59:57<32:41:50, 6.83s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [59:57<32:41:50, 6.83s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:02,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:00:04<32:31:19, 6.80s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:00:04<32:31:19, 6.80s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9696, 'learning_rate': 1.836e-05, 'epoch': 0.69} + 3%|██▌ | 612/17840 [1:00:04<32:31:19, 6.80s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:00:04<32:31:19, 6.80s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:00:04<32:31:19, 6.80s/it]g-point operations will not be computed-15 20:56:13,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:00:11<32:25:48, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:00:11<32:25:48, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:00:11<32:25:48, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:00:11<32:25:48, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [1:00:17<32:17:06, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:20,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:20,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 615/17840 [1:00:24<32:18:30, 6.75s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 615/17840 [1:00:24<32:18:30, 6.75s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.127, 'learning_rate': 1.845e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:28,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:00:31<32:05:23, 6.71s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:00:31<32:05:23, 6.71s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8424, 'learning_rate': 1.848e-05, 'epoch': 0.69} + 3%|██▌ | 616/17840 [1:00:31<32:05:23, 6.71s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:37,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:37,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9533, 'learning_rate': 1.851e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:37,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:37,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:37,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 618/17840 [1:00:44<31:51:41, 6.66s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:47,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:47,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 619/17840 [1:00:51<31:48:20, 6.65s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 619/17840 [1:00:51<31:48:20, 6.65s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9121, 'learning_rate': 1.857e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-15 20:58:55,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:00:57<31:39:37, 6.62s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:00:57<31:39:37, 6.62s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.961, 'learning_rate': 1.86e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:01,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:01:04<31:26:47, 6.57s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:01:04<31:26:47, 6.57s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9808, 'learning_rate': 1.863e-05, 'epoch': 0.7} + 3%|██▌ | 621/17840 [1:01:04<31:26:47, 6.57s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:01:04<31:26:47, 6.57s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:01:04<31:26:47, 6.57s/it]g-point operations will not be computed-15 20:58:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:01:10<31:16:14, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:01:10<31:16:14, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:01:10<31:16:14, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:01:10<31:16:14, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:01:17<31:04:22, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:19,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:19,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:19,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 624/17840 [1:01:23<30:52:40, 6.46s/it]g-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0441, 'learning_rate': 1.8750000000000002e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 20:59:25,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 20:59:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:01:37<31:53:38, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:38,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:01:37<31:53:38, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:38,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:01:37<31:53:38, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:38,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:01:37<31:53:38, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:38,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:01:43<31:11:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:01:43<31:11:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:01:43<31:11:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:01:43<31:11:57, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:44,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:01:49<30:42:21, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:50,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:01:49<30:42:21, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:50,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:01:49<30:42:21, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:50,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:01:49<30:42:21, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:50,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 629/17840 [1:01:55<30:20:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:56,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 629/17840 [1:01:55<30:20:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:56,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 629/17840 [1:01:55<30:20:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 20:59:56,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:02:02<30:07:03, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:02,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:02:02<30:07:03, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:02,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1287, 'learning_rate': 1.8900000000000002e-05, 'epoch': 0.71} + 4%|██▌ | 630/17840 [1:02:02<30:07:03, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:02,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:02:02<30:07:03, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:02,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:02:08<29:51:15, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:02:08<29:51:15, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:13,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:13,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7483, 'learning_rate': 1.896e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:13,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:13,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:13,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:02:20<29:08:44, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:02:20<29:08:44, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:25,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:25,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8727, 'learning_rate': 1.902e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:25,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:31,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:31,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9919, 'learning_rate': 1.9050000000000002e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:35,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 636/17840 [1:02:37<28:07:39, 5.89s/it]g-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 636/17840 [1:02:37<28:07:39, 5.89s/it]g-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:39,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:39,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:20,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 637/17840 [1:02:43<27:41:50, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 637/17840 [1:02:43<27:41:50, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9519, 'learning_rate': 1.911e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:47,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:47,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8088, 'learning_rate': 1.914e-05, 'epoch': 0.72} +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:47,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:53,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:53,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:00:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:43,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 640/17840 [1:02:59<26:06:26, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 640/17840 [1:02:59<26:06:26, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:03,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:03,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:05,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:08,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:08,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0427, 'learning_rate': 1.9260000000000002e-05, 'epoch': 0.72} +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:11,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:11,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:00:59,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 643/17840 [1:03:13<23:19:29, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:13,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 644/17840 [1:03:17<22:08:09, 4.63s/it]g-point operations will not be computed-15 21:01:13,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 644/17840 [1:03:17<22:08:09, 4.63s/it]g-point operations will not be computed-15 21:01:13,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 644/17840 [1:03:17<22:08:09, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:17,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [1:03:20<20:47:17, 4.35s/it]g-point operations will not be computed-15 21:01:17,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [1:03:20<20:47:17, 4.35s/it]g-point operations will not be computed-15 21:01:17,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [1:03:20<20:47:17, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:21,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 646/17840 [1:03:24<19:23:42, 4.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 646/17840 [1:03:24<19:23:42, 4.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 647/17840 [1:03:27<17:56:43, 3.76s/it]g-point operations will not be computed-15 21:01:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 647/17840 [1:03:27<17:56:43, 3.76s/it]g-point operations will not be computed-15 21:01:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:28,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:27,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 648/17840 [1:03:30<16:28:41, 3.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:29,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 648/17840 [1:03:30<16:28:41, 3.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:29,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 649/17840 [1:03:32<14:55:57, 3.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:32,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 649/17840 [1:03:32<14:55:57, 3.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:32,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:33,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:32,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:35<15:05:38, 3.16s/it]g-point operations will not be computed-15 21:01:32,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:35<15:05:38, 3.16s/it]g-point operations will not be computed-15 21:01:32,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:35<15:05:38, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:37,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:40,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:37,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:43<21:31:26, 4.51s/it]g-point operations will not be computed-15 21:01:37,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:43<21:31:26, 4.51s/it]g-point operations will not be computed-15 21:01:37,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:43<21:31:26, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:43<21:31:26, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:48,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:48,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 652/17840 [1:03:50<25:33:04, 5.35s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 652/17840 [1:03:50<25:33:04, 5.35s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:01:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:57<28:13:30, 5.91s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:57<28:13:30, 5.91s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:57<28:13:30, 5.91s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:57<28:13:30, 5.91s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:57<28:13:30, 5.91s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:04:04<29:55:56, 6.27s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:04:04<29:55:56, 6.27s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:09,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 655/17840 [1:04:12<31:12:05, 6.54s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 655/17840 [1:04:12<31:12:05, 6.54s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0325, 'learning_rate': 1.965e-05, 'epoch': 0.73} + 4%|██▋ | 655/17840 [1:04:12<31:12:05, 6.54s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 655/17840 [1:04:12<31:12:05, 6.54s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 655/17840 [1:04:12<31:12:05, 6.54s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:04:19<31:55:02, 6.69s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:04:19<31:55:02, 6.69s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:23,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:23,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:26<32:25:01, 6.79s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:26<32:25:01, 6.79s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:26<32:25:01, 6.79s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:26<32:25:01, 6.79s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:26<32:25:01, 6.79s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:04:33<32:41:34, 6.85s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:35,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:35,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:35,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:04:40<32:47:29, 6.87s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:04:40<32:47:29, 6.87s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:04:40<32:47:29, 6.87s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:46,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:46,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.827, 'learning_rate': 1.98e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:46,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:46,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:46,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:04:53<32:54:18, 6.90s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:04:53<32:54:18, 6.90s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:58,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:02:58,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:05:00<32:45:25, 6.86s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:05:00<32:45:25, 6.86s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:05:00<32:45:25, 6.86s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:06,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:06,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9525, 'learning_rate': 1.989e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:06,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:06,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:06,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 664/17840 [1:05:14<32:24:42, 6.79s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:05:21<32:21:26, 6.78s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:05:21<32:21:26, 6.78s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:25,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:05:27<32:03:47, 6.72s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:05:27<32:03:47, 6.72s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9609, 'learning_rate': 1.9980000000000002e-05, 'epoch': 0.75} + 4%|██▊ | 666/17840 [1:05:27<32:03:47, 6.72s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:33,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:33,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8846, 'learning_rate': 2.0010000000000003e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:33,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:39,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:39,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7979, 'learning_rate': 2.004e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:39,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:39,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:05:47<31:42:01, 6.65s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:05:47<31:42:01, 6.65s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:49,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:49,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:05:53<31:27:27, 6.60s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:05:53<31:27:27, 6.60s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8455, 'learning_rate': 2.01e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-15 21:03:57,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:06:00<31:16:35, 6.56s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:06:00<31:16:35, 6.56s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7517, 'learning_rate': 2.0130000000000002e-05, 'epoch': 0.75} + 4%|██▊ | 671/17840 [1:06:00<31:16:35, 6.56s/it]g-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:06,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:06,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8857, 'learning_rate': 2.016e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:06,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:12,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:12,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8616, 'learning_rate': 2.019e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:12,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:12,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:12,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:01:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:06:19<30:46:48, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:06:19<30:46:48, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:06:19<30:46:48, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:06:19<30:46:48, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:06:27<32:32:42, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:06:27<32:32:42, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:06:27<32:32:42, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:06:27<32:32:42, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:32,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:32,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:32,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:32,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:39,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:39,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:39,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:39,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:04:39,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:04:20,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:06:46<30:54:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:47,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:06:46<30:54:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:47,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:06:46<30:54:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:47,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:06:46<30:54:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:47,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:06:52<30:26:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:06:52<30:26:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:06:52<30:26:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:06:52<30:26:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:06:58<30:02:28, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:59,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:06:58<30:02:28, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:59,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:06:58<30:02:28, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:59,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:06:58<30:02:28, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:04:59,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:07:04<29:48:26, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:05,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:07:04<29:48:26, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:05,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:07:04<29:48:26, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:05,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:07:04<29:48:26, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:05,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:07:10<29:29:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:07:10<29:29:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:07:10<29:29:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:15,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:15,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:20,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:20,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 684/17840 [1:07:22<28:38:42, 6.01s/it]g-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 684/17840 [1:07:22<28:38:42, 6.01s/it]g-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:25,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:25,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:07:28<28:14:20, 5.93s/it]g-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:07:28<28:14:20, 5.93s/it]g-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:31,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:31,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 686/17840 [1:07:33<27:52:11, 5.85s/it]g-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:35,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:35,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:35,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:11,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:07:39<27:23:32, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:07:39<27:23:32, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:07:39<27:23:32, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:43,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:43,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:48,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:48,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:39,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 689/17840 [1:07:50<26:29:11, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 689/17840 [1:07:50<26:29:11, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 689/17840 [1:07:50<26:29:11, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:54,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:54,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:58,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:05:58,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:05:50,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:08:00<25:14:10, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:08:00<25:14:10, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:08:00<25:14:10, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:04,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:06,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:06,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:08,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:10,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:10,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:12,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:14,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:14,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:16,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:17,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:17,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:19,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:22,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:22,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:23,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:23,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:26,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:26,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:28,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:30,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:30,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1269, 'learning_rate': 2.1e-05, 'epoch': 0.78} +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:34,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:34,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:38,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:38,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2143, 'learning_rate': 2.103e-05, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:42,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:42,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:42,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:08:46<25:38:14, 5.39s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:08:46<25:38:14, 5.39s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:06:51,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:54<28:16:55, 5.94s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:54<28:16:55, 5.94s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1069, 'learning_rate': 2.109e-05, 'epoch': 0.79} + 4%|██▉ | 703/17840 [1:08:54<28:16:55, 5.94s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:54<28:16:55, 5.94s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:54<28:16:55, 5.94s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:09:01<30:00:03, 6.30s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:09:01<30:00:03, 6.30s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:05,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:09:08<31:20:30, 6.58s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:09:08<31:20:30, 6.58s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9455, 'learning_rate': 2.115e-05, 'epoch': 0.79} + 4%|██▉ | 705/17840 [1:09:08<31:20:30, 6.58s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:09:08<31:20:30, 6.58s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:09:08<31:20:30, 6.58s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:09:15<32:02:43, 6.73s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:18,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:18,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:09:22<32:33:20, 6.84s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:09:22<32:33:20, 6.84s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9517, 'learning_rate': 2.121e-05, 'epoch': 0.79} + 4%|██▉ | 707/17840 [1:09:22<32:33:20, 6.84s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:09:22<32:33:20, 6.84s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:09:22<32:33:20, 6.84s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:09:29<32:46:27, 6.89s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:32,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:32,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:36<32:57:06, 6.92s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:36<32:57:06, 6.92s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.883, 'learning_rate': 2.1269999999999998e-05, 'epoch': 0.79} + 4%|██▉ | 709/17840 [1:09:36<32:57:06, 6.92s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:42,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:42,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8345, 'learning_rate': 2.13e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:42,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:42,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:09:50<32:56:26, 6.92s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:09:50<32:56:26, 6.92s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:53,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:07:53,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:09:57<32:48:58, 6.90s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:09:57<32:48:58, 6.90s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7168, 'learning_rate': 2.136e-05, 'epoch': 0.8} + 4%|██▉ | 712/17840 [1:09:57<32:48:58, 6.90s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:03,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:03,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7539, 'learning_rate': 2.139e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:03,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:03,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:10:10<32:39:28, 6.86s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:10:10<32:39:28, 6.86s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:13,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:13,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:10:17<32:25:15, 6.82s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:10:17<32:25:15, 6.82s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.902, 'learning_rate': 2.145e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:21,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:21,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:10:24<32:19:18, 6.80s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:10:24<32:19:18, 6.80s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:10:24<32:19:18, 6.80s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:10:24<32:19:18, 6.80s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:10:24<32:19:18, 6.80s/it]g-point operations will not be computed-15 21:06:00,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:10:31<32:13:18, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:10:31<32:13:18, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:10:31<32:13:18, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:10:31<32:13:18, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:10:37<32:02:26, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:40,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:40,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:40,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:10:44<31:49:04, 6.69s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:10:44<31:49:04, 6.69s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 720/17840 [1:10:50<31:36:39, 6.65s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 720/17840 [1:10:50<31:36:39, 6.65s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:55,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:08:55,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:10:57<31:23:33, 6.60s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:10:57<31:23:33, 6.60s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:10:57<31:23:33, 6.60s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:03,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:03,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7415, 'learning_rate': 2.166e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:03,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:03,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:03,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:11:10<31:15:50, 6.58s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:12,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:12,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:12,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:11:16<31:03:03, 6.53s/it]g-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:19,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:19,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:19,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:08:32,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:11:24<32:37:39, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:25,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:11:24<32:37:39, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:25,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:11:24<32:37:39, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:25,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:11:24<32:37:39, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:25,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:11:31<32:02:22, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:11:31<32:02:22, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:11:31<32:02:22, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:11:31<32:02:22, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:11:37<31:21:50, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:11:37<31:21:50, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:11:37<31:21:50, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:11:37<31:21:50, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 728/17840 [1:11:43<30:49:23, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:45,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:45,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:45,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 729/17840 [1:11:49<30:26:50, 6.41s/it]g-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:52,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:52,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:52,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 730/17840 [1:11:55<30:09:19, 6.34s/it]g-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:58,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:58,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:09:58,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 731/17840 [1:12:02<29:46:48, 6.27s/it]g-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:04,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:04,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:04,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:12:08<29:27:22, 6.20s/it]g-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:10,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:10,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:10,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:09:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:12:14<29:03:23, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:12:14<29:03:23, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:18,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:18,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9694, 'learning_rate': 2.202e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:23,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:12:25<28:03:30, 5.91s/it]g-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:12:25<28:03:30, 5.91s/it]g-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7573, 'learning_rate': 2.205e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:28,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 736/17840 [1:12:30<27:31:48, 5.79s/it]g-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 736/17840 [1:12:30<27:31:48, 5.79s/it]g-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:32,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:32,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:32,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 737/17840 [1:12:36<27:06:11, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 737/17840 [1:12:36<27:06:11, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:40,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:40,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8313, 'learning_rate': 2.214e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:44,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 739/17840 [1:12:46<25:56:53, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:47,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 739/17840 [1:12:46<25:56:53, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:47,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6969, 'learning_rate': 2.217e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:51,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:47,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:51,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:47,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7981, 'learning_rate': 2.22e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:54,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:47,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:54,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:47,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 741/17840 [1:12:56<24:36:32, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:10:57,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:10:59,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:10:57,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 742/17840 [1:13:01<23:49:52, 5.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 742/17840 [1:13:01<23:49:52, 5.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7834, 'learning_rate': 2.226e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:05,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:05,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:07,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:09,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:09,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:11,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:12,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:12,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:14,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:17,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:17,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:19,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:19,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:22,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:22,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:23,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:25,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:25,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:27,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:27,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.307, 'learning_rate': 2.25e-05, 'epoch': 0.84} +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:31,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:31,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:35,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:35,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0348, 'learning_rate': 2.253e-05, 'epoch': 0.84} +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:39,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:39,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:39,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:13:43<25:26:37, 5.36s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:46,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:46,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:11:46,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:50<28:10:26, 5.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:50<28:10:26, 5.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:50<28:10:26, 5.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:50<28:10:26, 5.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:50<28:10:26, 5.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:13:57<29:53:37, 6.30s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:00,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:00,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:00,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:14:05<31:14:30, 6.58s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:14:05<31:14:30, 6.58s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:14:05<31:14:30, 6.58s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:14:05<31:14:30, 6.58s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:14:05<31:14:30, 6.58s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 756/17840 [1:14:12<32:02:35, 6.75s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:15,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:15,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:15,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:14:19<32:23:51, 6.83s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:14:19<32:23:51, 6.83s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:14:19<32:23:51, 6.83s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:14:19<32:23:51, 6.83s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:14:19<32:23:51, 6.83s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 758/17840 [1:14:26<32:45:33, 6.90s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:29,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:29,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:29,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:14:33<32:48:41, 6.92s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:14:33<32:48:41, 6.92s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:14:33<32:48:41, 6.92s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:39,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:39,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7419, 'learning_rate': 2.2800000000000002e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:39,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:39,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:39,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 761/17840 [1:14:47<32:56:08, 6.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:49,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:49,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:12:49,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:54<32:54:01, 6.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:54<32:54:01, 6.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:54<32:54:01, 6.94s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:00,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:00,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6298, 'learning_rate': 2.289e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:00,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:00,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:00,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:15:07<32:43:22, 6.90s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:10,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:10,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:15:14<32:40:20, 6.89s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:15:14<32:40:20, 6.89s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7393, 'learning_rate': 2.2950000000000002e-05, 'epoch': 0.86} + 4%|███▏ | 765/17840 [1:15:14<32:40:20, 6.89s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:15:14<32:40:20, 6.89s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:15:14<32:40:20, 6.89s/it]g-point operations will not be computed-15 21:11:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:15:21<32:26:59, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:15:21<32:26:59, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:15:21<32:26:59, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:15:21<32:26:59, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:15:28<32:13:20, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:30,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:30,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:15:34<32:00:24, 6.75s/it]g-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:15:34<32:00:24, 6.75s/it]g-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7058, 'learning_rate': 2.304e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:39,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:15:41<31:49:55, 6.71s/it]g-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:15:41<31:49:55, 6.71s/it]g-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7976, 'learning_rate': 2.307e-05, 'epoch': 0.86} + 4%|███▏ | 769/17840 [1:15:41<31:49:55, 6.71s/it]g-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6633, 'learning_rate': 2.3100000000000002e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:13:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:22,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:15:54<31:32:34, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:15:54<31:32:34, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:15:54<31:32:34, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 772/17840 [1:16:01<31:22:35, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 772/17840 [1:16:01<31:22:35, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:03,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:03,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:16:07<31:23:35, 6.62s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:16:07<31:23:35, 6.62s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7989, 'learning_rate': 2.319e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:11,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:16:14<31:07:44, 6.57s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:16:14<31:07:44, 6.57s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6196, 'learning_rate': 2.322e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:18,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:16:22<32:46:50, 6.92s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:16:22<32:46:50, 6.92s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:24,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:24,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 776/17840 [1:16:28<32:12:48, 6.80s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 776/17840 [1:16:28<32:12:48, 6.80s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6464, 'learning_rate': 2.328e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:32,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:32,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:16:34<31:27:20, 6.64s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:16:34<31:27:20, 6.64s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:38,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:38,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:16:41<30:49:39, 6.50s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:16:41<30:49:39, 6.50s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:44,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:44,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 779/17840 [1:16:47<30:20:51, 6.40s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 779/17840 [1:16:47<30:20:51, 6.40s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:50,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:50,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 780/17840 [1:16:53<29:55:33, 6.31s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 780/17840 [1:16:53<29:55:33, 6.31s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:57,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:14:57,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:16:59<29:32:03, 6.23s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:16:59<29:32:03, 6.23s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:03,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:03,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:17:05<29:13:00, 6.17s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:07,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:07,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:07,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:17:11<28:57:12, 6.11s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:17:11<28:57:12, 6.11s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:14,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:14,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 784/17840 [1:17:17<28:28:10, 6.01s/it]g-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:19,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:19,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:19,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:13:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:17:22<27:58:33, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:26,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 786/17840 [1:17:28<27:35:28, 5.82s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 786/17840 [1:17:28<27:35:28, 5.82s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6837, 'learning_rate': 2.358e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:31,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 787/17840 [1:17:33<27:07:16, 5.73s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 787/17840 [1:17:33<27:07:16, 5.73s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:35,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:38,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:38,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7322, 'learning_rate': 2.364e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:42,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 789/17840 [1:17:44<26:07:11, 5.51s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 789/17840 [1:17:44<26:07:11, 5.51s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:46,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:48,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:48,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6129, 'learning_rate': 2.37e-05, 'epoch': 0.89} +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:52,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 791/17840 [1:17:54<25:00:24, 5.28s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 791/17840 [1:17:54<25:00:24, 5.28s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:56,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:58,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:15:58,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4656, 'learning_rate': 2.3760000000000003e-05, 'epoch': 0.89} + 4%|███▎ | 793/17840 [1:18:03<23:24:48, 4.94s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:18:03<23:24:48, 4.94s/it]g-point operations will not be computed-15 21:15:23,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:18:03<23:24:48, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:04,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 794/17840 [1:18:08<22:14:20, 4.70s/it]g-point operations will not be computed-15 21:16:04,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 794/17840 [1:18:08<22:14:20, 4.70s/it]g-point operations will not be computed-15 21:16:04,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 794/17840 [1:18:08<22:14:20, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:08,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:18:11<20:49:18, 4.40s/it]g-point operations will not be computed-15 21:16:08,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:18:11<20:49:18, 4.40s/it]g-point operations will not be computed-15 21:16:08,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:18:11<20:49:18, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:11,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 796/17840 [1:18:15<19:24:42, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:15,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 796/17840 [1:18:15<19:24:42, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:15,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 797/17840 [1:18:18<17:51:42, 3.77s/it]g-point operations will not be computed-15 21:16:15,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 797/17840 [1:18:18<17:51:42, 3.77s/it]g-point operations will not be computed-15 21:16:15,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:19,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:18,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 798/17840 [1:18:20<16:21:49, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:20,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 798/17840 [1:18:20<16:21:49, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:20,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 799/17840 [1:18:23<14:56:09, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:23,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 799/17840 [1:18:23<14:56:09, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:23,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:24,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:23,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:18:26<15:07:32, 3.20s/it]g-point operations will not be computed-15 21:16:23,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:18:26<15:07:32, 3.20s/it]g-point operations will not be computed-15 21:16:23,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:18:26<15:07:32, 3.20s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:28,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:18:26<15:07:32, 3.20s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:28,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:31,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:28,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:31,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:28,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:18:34<21:43:00, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:18:34<21:43:00, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:39,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:39,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:18:41<25:36:13, 5.41s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:18:41<25:36:13, 5.41s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:18:41<25:36:13, 5.41s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:18:41<25:36:13, 5.41s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:18:41<25:36:13, 5.41s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:18:48<28:07:19, 5.94s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:51,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:51,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:16:51,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:56<29:52:18, 6.31s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:56<29:52:18, 6.31s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:56<29:52:18, 6.31s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:56<29:52:18, 6.31s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:56<29:52:18, 6.31s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:19:03<31:01:45, 6.56s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:05,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:05,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:05,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:19:10<31:41:00, 6.70s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:19:10<31:41:00, 6.70s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:19:10<31:41:00, 6.70s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7602, 'learning_rate': 2.4210000000000004e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:19:24<32:22:54, 6.84s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:19:24<32:22:54, 6.84s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:19:24<32:22:54, 6.84s/it]g-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:30,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:30,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7044, 'learning_rate': 2.4270000000000003e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:30,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:30,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:30,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:16:35,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:38<32:24:39, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:38<32:24:39, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:38<32:24:39, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:38<32:24:39, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 811/17840 [1:19:44<32:15:49, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:19:51<32:14:56, 6.82s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:19:51<32:14:56, 6.82s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:19:51<32:14:56, 6.82s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:57,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:57,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5942, 'learning_rate': 2.439e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:57,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:57,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:17:57,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:20:05<32:02:16, 6.77s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:07,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:07,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:20:11<31:50:43, 6.73s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:20:11<31:50:43, 6.73s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6793, 'learning_rate': 2.4449999999999998e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:15,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:20:18<31:44:21, 6.71s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:20:18<31:44:21, 6.71s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6221, 'learning_rate': 2.448e-05, 'epoch': 0.91} + 5%|███▍ | 816/17840 [1:20:18<31:44:21, 6.71s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:24,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:24,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7447, 'learning_rate': 2.4509999999999997e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:24,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:24,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:24,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:20:31<31:18:43, 6.62s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:33,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:33,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 819/17840 [1:20:37<31:12:54, 6.60s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 819/17840 [1:20:37<31:12:54, 6.60s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:40,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:40,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:20:44<31:02:15, 6.56s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:20:44<31:02:15, 6.56s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7146, 'learning_rate': 2.4599999999999998e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:48,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:20:50<30:54:09, 6.54s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:20:50<30:54:09, 6.54s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7183, 'learning_rate': 2.463e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-15 21:18:54,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:20:57<30:35:13, 6.47s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:20:57<30:35:13, 6.47s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5901, 'learning_rate': 2.4659999999999998e-05, 'epoch': 0.92} + 5%|███▍ | 822/17840 [1:20:57<30:35:13, 6.47s/it]g-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:02,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:02,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7405, 'learning_rate': 2.469e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:02,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:02,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:02,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:17:38,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:21:09<30:07:15, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:21:09<30:07:15, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:21:09<30:07:15, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:21:17<31:46:28, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:21:17<31:46:28, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.868, 'learning_rate': 2.475e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:21,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 826/17840 [1:21:23<31:07:30, 6.59s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 826/17840 [1:21:23<31:07:30, 6.59s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7735, 'learning_rate': 2.478e-05, 'epoch': 0.93} + 5%|███▍ | 826/17840 [1:21:23<31:07:30, 6.59s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:28,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:28,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6145, 'learning_rate': 2.4809999999999998e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:33,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 828/17840 [1:21:35<29:53:35, 6.33s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 828/17840 [1:21:35<29:53:35, 6.33s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5194, 'learning_rate': 2.484e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:39,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:21:41<29:31:46, 6.25s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:21:41<29:31:46, 6.25s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5678, 'learning_rate': 2.487e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:45,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:21:47<29:11:39, 6.18s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:21:47<29:11:39, 6.18s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6363, 'learning_rate': 2.49e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:51,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:21:53<29:04:51, 6.16s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:21:53<29:04:51, 6.16s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5251, 'learning_rate': 2.493e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-15 21:19:57,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:21:59<28:46:15, 6.09s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:21:59<28:46:15, 6.09s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:02,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:02,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:02,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:22:05<28:35:16, 6.05s/it]g-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:19:10,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:22:11<28:07:30, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:22:11<28:07:30, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:16,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:16,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6031, 'learning_rate': 2.505e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:20,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:20,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███��� | 836/17840 [1:22:22<27:12:00, 5.76s/it]g-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:22:28<26:41:48, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:22:28<26:41:48, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:22:28<26:41:48, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:32,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:32,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:36,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:36,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 839/17840 [1:22:38<25:39:03, 5.43s/it]g-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:40,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:40,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:42,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:44,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:47,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:47,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7463, 'learning_rate': 2.523e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:50,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:50,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:28,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 842/17840 [1:22:52<22:49:05, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:52,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:54,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:52,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:20:54,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:20:52,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 843/17840 [1:22:56<21:33:36, 4.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:56,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 843/17840 [1:22:56<21:33:36, 4.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:20:56,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:23:00<20:24:45, 4.32s/it]g-point operations will not be computed-15 21:20:56,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:23:00<20:24:45, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:00,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:23:00<20:24:45, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:00,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 845/17840 [1:23:03<18:58:47, 4.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:03,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:04,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:03,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:04,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:03,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 846/17840 [1:23:06<17:37:24, 3.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 846/17840 [1:23:06<17:37:24, 3.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 847/17840 [1:23:09<16:14:46, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:09,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 847/17840 [1:23:09<16:14:46, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:09,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 848/17840 [1:23:11<14:57:12, 3.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:11,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 848/17840 [1:23:11<14:57:12, 3.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:11,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 849/17840 [1:23:14<13:46:20, 2.92s/it]g-point operations will not be computed-15 21:21:11,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:14,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:13,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:14,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:13,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:23:17<14:15:21, 3.02s/it]g-point operations will not be computed-15 21:21:13,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:23:17<14:15:21, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:18,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:23:17<14:15:21, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:18,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:22,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:18,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:22,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:18,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:23:24<20:42:06, 4.39s/it]g-point operations will not be computed-15 21:21:18,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:23:24<20:42:06, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:25,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:29,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:25,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:23:32<25:04:48, 5.31s/it]g-point operations will not be computed-15 21:21:25,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:23:32<25:04:48, 5.31s/it]g-point operations will not be computed-15 21:21:25,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:23:32<25:04:48, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:23:32<25:04:48, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:23:32<25:04:48, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:23:32<25:04:48, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:23:39<27:50:30, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:23:39<27:50:30, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:23:39<27:50:30, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:45,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:45,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9454, 'learning_rate': 2.562e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:45,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:45,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:21:45,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:53<30:53:05, 6.55s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:53<30:53:05, 6.55s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:53<30:53:05, 6.55s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:00,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:00,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.79, 'learning_rate': 2.568e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:00,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:00,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:00,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:24:07<31:57:08, 6.77s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:10,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:10,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:10,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:24:14<32:08:28, 6.81s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:24:14<32:08:28, 6.81s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:24:14<32:08:28, 6.81s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:20,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:20,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.493, 'learning_rate': 2.577e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:20,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:20,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:20,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:24:28<32:17:02, 6.84s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:24:28<32:17:02, 6.84s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:32,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:24:35<32:17:20, 6.85s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:24:35<32:17:20, 6.85s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8028, 'learning_rate': 2.5830000000000002e-05, 'epoch': 0.97} + 5%|███▌ | 861/17840 [1:24:35<32:17:20, 6.85s/it]g-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6868, 'learning_rate': 2.586e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:21:33,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:24:48<32:03:11, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:24:48<32:03:11, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:24:48<32:03:11, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 864/17840 [1:24:55<31:52:46, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 864/17840 [1:24:55<31:52:46, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8055, 'learning_rate': 2.592e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-15 21:22:59,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 865/17840 [1:25:02<31:47:44, 6.74s/it]g-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 865/17840 [1:25:02<31:47:44, 6.74s/it]g-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7054, 'learning_rate': 2.595e-05, 'epoch': 0.97} + 5%|███▌ | 865/17840 [1:25:02<31:47:44, 6.74s/it]g-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:08,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:08,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5415, 'learning_rate': 2.5980000000000002e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:08,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:08,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:08,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:22:49,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:25:15<31:26:00, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:25:15<31:26:00, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:25:15<31:26:00, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:25:22<31:16:22, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:25:22<31:16:22, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:24,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:24,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:25:28<31:06:39, 6.60s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:25:28<31:06:39, 6.60s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:25:35<30:49:46, 6.54s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:25:35<30:49:46, 6.54s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5725, 'learning_rate': 2.61e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:39,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:39,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:25:41<30:38:58, 6.50s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:25:41<30:38:58, 6.50s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:45,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:45,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 872/17840 [1:25:47<30:20:03, 6.44s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 872/17840 [1:25:47<30:20:03, 6.44s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 872/17840 [1:25:47<30:20:03, 6.44s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 872/17840 [1:25:47<30:20:03, 6.44s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:53,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:53,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:57,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:23:57,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:26:00<29:52:08, 6.34s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:26:00<29:52:08, 6.34s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:26:00<29:52:08, 6.34s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:26:00<29:52:08, 6.34s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:26:00<29:52:08, 6.34s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:26:07<31:28:34, 6.68s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:26:07<31:28:34, 6.68s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:11,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:11,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:26:13<30:45:34, 6.53s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:26:13<30:45:34, 6.53s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:17,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:17,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 877/17840 [1:26:19<29:59:40, 6.37s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:22,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:22,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:22,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:26:25<29:19:45, 6.22s/it]g-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:27,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:27,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:27,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:23:16,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 879/17840 [1:26:31<28:49:15, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 879/17840 [1:26:31<28:49:15, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:36,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:36,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7329, 'learning_rate': 2.64e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:40,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:40,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 881/17840 [1:26:42<27:33:17, 5.85s/it]g-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 881/17840 [1:26:42<27:33:17, 5.85s/it]g-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:46,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:46,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:26:48<27:01:35, 5.74s/it]g-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:50,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:52,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:52,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4379, 'learning_rate': 2.6490000000000002e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:56,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:24:56,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:32,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 884/17840 [1:26:58<25:19:57, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:01,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:01,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 885/17840 [1:27:02<24:10:14, 5.13s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:04,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:06,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:06,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:08,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:10,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:10,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:12,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:12,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:13,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:17,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:17,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:18,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:18,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:21,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:21,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:23,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:23,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:24,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:24,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:28,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:28,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:28,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:32,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:32,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:35,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.227, 'learning_rate': 2.682e-05, 'epoch': 1.0} +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:27:47<27:29:02, 5.84s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:27:47<27:29:02, 5.84s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:25:52,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:27:54<29:19:12, 6.23s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:27:54<29:19:12, 6.23s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.822, 'learning_rate': 2.688e-05, 'epoch': 1.0} + 5%|███▋ | 896/17840 [1:27:54<29:19:12, 6.23s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:27:54<29:19:12, 6.23s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:27:54<29:19:12, 6.23s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:28:01<30:33:48, 6.49s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:28:01<30:33:48, 6.49s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:28:01<30:33:48, 6.49s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:08,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:08,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7973, 'learning_rate': 2.6940000000000003e-05, 'epoch': 1.01} +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:08,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:08,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:08,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:28:15<31:59:18, 6.80s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:28:15<31:59:18, 6.80s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:20,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:20,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:28:24<34:10:07, 7.26s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:28:24<34:10:07, 7.26s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:28,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:28:31<33:42:52, 7.17s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:28:31<33:42:52, 7.17s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7611, 'learning_rate': 2.703e-05, 'epoch': 1.01} + 5%|███▋ | 901/17840 [1:28:31<33:42:52, 7.17s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:28:31<33:42:52, 7.17s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:28:31<33:42:52, 7.17s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:28:38<33:22:03, 7.09s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:40,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:40,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:28:45<33:01:53, 7.02s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:28:45<33:01:53, 7.02s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4084, 'learning_rate': 2.709e-05, 'epoch': 1.01} + 5%|███▋ | 903/17840 [1:28:45<33:01:53, 7.02s/it]g-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:51,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:51,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5845, 'learning_rate': 2.712e-05, 'epoch': 1.01} +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:51,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:51,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:26:51,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:24:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:58<32:27:20, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:58<32:27:20, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:58<32:27:20, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:29:05<32:13:08, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:29:05<32:13:08, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:07,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:07,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:29:12<31:59:44, 6.80s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:29:12<31:59:44, 6.80s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7248, 'learning_rate': 2.7210000000000002e-05, 'epoch': 1.02} + 5%|███▊ | 907/17840 [1:29:12<31:59:44, 6.80s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:17,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:17,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7341, 'learning_rate': 2.724e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:17,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:17,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:29:25<31:39:42, 6.73s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:29:25<31:39:42, 6.73s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:27,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:27,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:29:31<31:30:11, 6.70s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:29:31<31:30:11, 6.70s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3934, 'learning_rate': 2.7300000000000003e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:36,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:29:38<31:12:10, 6.64s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:29:38<31:12:10, 6.64s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.458, 'learning_rate': 2.733e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:42,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:29:44<30:59:27, 6.59s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:29:44<30:59:27, 6.59s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4828, 'learning_rate': 2.7360000000000002e-05, 'epoch': 1.02} + 5%|███▊ | 912/17840 [1:29:44<30:59:27, 6.59s/it]g-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:50,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:50,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.578, 'learning_rate': 2.739e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:50,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:57,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:57,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6104, 'learning_rate': 2.7420000000000002e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:57,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:57,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:27:57,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:26:59,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:30:04<30:32:46, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:30:04<30:32:46, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:30:04<30:32:46, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:30:04<30:32:46, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:30:10<30:21:41, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:13,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:13,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:13,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:30:17<30:13:22, 6.43s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:30:17<30:13:22, 6.43s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:20,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:20,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:30:23<29:59:45, 6.38s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:30:23<29:59:45, 6.38s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:27,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:27,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:30:29<29:45:49, 6.33s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:30:29<29:45:49, 6.33s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:33,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:33,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:30:35<29:43:19, 6.32s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:30:35<29:43:19, 6.32s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:39,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:39,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:30:41<29:26:08, 6.26s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:30:41<29:26:08, 6.26s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:45,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:45,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 922/17840 [1:30:47<29:06:37, 6.19s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 922/17840 [1:30:47<29:06:37, 6.19s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:51,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:51,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 923/17840 [1:30:54<28:54:46, 6.15s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 923/17840 [1:30:54<28:54:46, 6.15s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:57,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:28:57,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 924/17840 [1:31:00<28:41:39, 6.11s/it]g-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:02,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:02,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:02,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:28:05,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:31:07<30:16:54, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:31:07<30:16:54, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4846, 'learning_rate': 2.778e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:18,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:18,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5343, 'learning_rate': 2.7810000000000003e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:22,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:22,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 928/17840 [1:31:24<28:04:21, 5.98s/it]g-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:26,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:26,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:26,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:08,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:31:30<27:28:31, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:31:30<27:28:31, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:34,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:34,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.694, 'learning_rate': 2.79e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:38,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:38,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 931/17840 [1:31:40<26:14:48, 5.59s/it]g-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:42,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:42,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:42,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:30,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 932/17840 [1:31:45<25:31:43, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:48,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:48,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 933/17840 [1:31:50<24:49:41, 5.29s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:52,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:52,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:54,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:56,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:58,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:29:58,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:01,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:03,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:03,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:05,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:06,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:06,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:08,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:08,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:10,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:13,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:13,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:14,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:14,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:17,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:17,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:19,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:19,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:20,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:20,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:24,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:27,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:27,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8214, 'learning_rate': 2.829e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:31,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:31,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:35,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:35,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7267, 'learning_rate': 2.832e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:35,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:35,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:35,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:32:43<27:07:30, 5.78s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:46,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:30:46,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:32:50<29:04:08, 6.19s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:32:50<29:04:08, 6.19s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7203, 'learning_rate': 2.838e-05, 'epoch': 1.06} + 5%|███▉ | 946/17840 [1:32:50<29:04:08, 6.19s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:32:50<29:04:08, 6.19s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:32:50<29:04:08, 6.19s/it]g-point operations will not be computed-15 21:29:46,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:57<30:18:03, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:57<30:18:03, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:57<30:18:03, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:33:04<31:11:56, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:33:04<31:11:56, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7603, 'learning_rate': 2.844e-05, 'epoch': 1.06} + 5%|███▉ | 948/17840 [1:33:04<31:11:56, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:10,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:10,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6054, 'learning_rate': 2.847e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:10,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:10,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:33:20<34:00:57, 7.25s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:33:20<34:00:57, 7.25s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7108, 'learning_rate': 2.8499999999999998e-05, 'epoch': 1.07} + 5%|███▉ | 950/17840 [1:33:20<34:00:57, 7.25s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:33:20<34:00:57, 7.25s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:33:27<33:42:48, 7.19s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:33:27<33:42:48, 7.19s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3223, 'learning_rate': 2.853e-05, 'epoch': 1.07} + 5%|███▉ | 951/17840 [1:33:27<33:42:48, 7.19s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:33,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:33,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5932, 'learning_rate': 2.856e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:33,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:33,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:33:40<33:05:40, 7.06s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:33:40<33:05:40, 7.06s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:33:47<32:57:12, 7.03s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:33:47<32:57:12, 7.03s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4184, 'learning_rate': 2.862e-05, 'epoch': 1.07} + 5%|███▉ | 954/17840 [1:33:47<32:57:12, 7.03s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7351, 'learning_rate': 2.865e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:31:53,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:34:01<32:24:24, 6.91s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:34:01<32:24:24, 6.91s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5592, 'learning_rate': 2.868e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:05,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:05,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:34:08<32:06:20, 6.85s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:34:08<32:06:20, 6.85s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:12,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:12,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:34:14<31:56:01, 6.81s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:34:14<31:56:01, 6.81s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:34:14<31:56:01, 6.81s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:20,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:20,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6429, 'learning_rate': 2.877e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:20,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:20,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:20,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:34:28<31:28:33, 6.71s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:30,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:30,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:30,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:34:34<31:13:49, 6.66s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:34:34<31:13:49, 6.66s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:38,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:38,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:34:41<31:14:08, 6.66s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:34:41<31:14:08, 6.66s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:34:41<31:14:08, 6.66s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:34:41<31:14:08, 6.66s/it]g-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:47,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:47,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:47,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:53,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:53,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4922, 'learning_rate': 2.892e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:53,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:32:53,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:30:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:35:00<30:34:09, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:35:00<30:34:09, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4355, 'learning_rate': 2.895e-05, 'epoch': 1.08} + 5%|████ | 965/17840 [1:35:00<30:34:09, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 966/17840 [1:35:07<30:18:16, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 966/17840 [1:35:07<30:18:16, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:09,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:09,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:35:13<30:04:06, 6.42s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:35:13<30:04:06, 6.42s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:15,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:15,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:35:19<29:45:36, 6.35s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:35:19<29:45:36, 6.35s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:21,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:21,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:35:25<29:30:07, 6.30s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:35:25<29:30:07, 6.30s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:28,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:28,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 970/17840 [1:35:31<29:16:18, 6.25s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 970/17840 [1:35:31<29:16:18, 6.25s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:34,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:34,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 971/17840 [1:35:38<29:11:33, 6.23s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 971/17840 [1:35:38<29:11:33, 6.23s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:40,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:40,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:35:44<29:00:57, 6.19s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:35:44<29:00:57, 6.19s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4708, 'learning_rate': 2.916e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 973/17840 [1:35:50<28:46:32, 6.14s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 973/17840 [1:35:50<28:46:32, 6.14s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:52,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:52,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:35:56<28:21:01, 6.05s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:35:56<28:21:01, 6.05s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:58,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:33:58,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:36:03<29:52:30, 6.38s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:36:03<29:52:30, 6.38s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3999, 'learning_rate': 2.925e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:06,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 976/17840 [1:36:09<29:07:41, 6.22s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 976/17840 [1:36:09<29:07:41, 6.22s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:11,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:11,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 977/17840 [1:36:14<28:19:29, 6.05s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 977/17840 [1:36:14<28:19:29, 6.05s/it]g-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:16,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:16,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:33:01,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:36:20<27:44:43, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:36:20<27:44:43, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3126, 'learning_rate': 2.934e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:25,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:25,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4723, 'learning_rate': 2.9370000000000002e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:29,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 980/17840 [1:36:31<26:27:12, 5.65s/it]g-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 980/17840 [1:36:31<26:27:12, 5.65s/it]g-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:32,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:35,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:35,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3614, 'learning_rate': 2.943e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:39,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:39,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:20,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 982/17840 [1:36:41<24:46:09, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 982/17840 [1:36:41<24:46:09, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 982/17840 [1:36:41<24:46:09, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:44,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:47,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:47,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:49,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:51,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:51,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:53,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:55,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:55,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:57,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:58,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:34:58,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:00,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:00,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:03,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:04,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:04,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:07,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:07,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:08,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:08,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:10,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:10,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:16,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:16,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:16,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:20,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:20,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:24,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:24,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:27,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:27,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:31,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:31,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:31,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 995/17840 [1:37:35<26:41:56, 5.71s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 995/17840 [1:37:35<26:41:56, 5.71s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 995/17840 [1:37:35<26:41:56, 5.71s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:42,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:42,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8066, 'learning_rate': 2.9880000000000002e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:42,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:42,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:42,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:37:49<29:56:17, 6.40s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:52,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:52,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:35:52,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:56<30:47:10, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:56<30:47:10, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:56<30:47:10, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:56<30:47:10, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:56<30:47:10, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:38:03<31:19:29, 6.70s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:06,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:06,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:06,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:38:12<33:38:41, 7.19s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:15,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:15,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:38:19<33:30:30, 7.16s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:38:19<33:30:30, 7.16s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5312, 'learning_rate': 2.9998218527315912e-05, 'epoch': 1.12} + 6%|████ | 1001/17840 [1:38:19<33:30:30, 7.16s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:25,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:25,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5694, 'learning_rate': 2.999643705463183e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:25,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:25,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:25,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:38:32<32:34:48, 6.97s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:38:32<32:34:48, 6.97s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:37,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1004/17840 [1:38:39<32:21:49, 6.92s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1004/17840 [1:38:39<32:21:49, 6.92s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.612, 'learning_rate': 2.999287410926366e-05, 'epoch': 1.13} + 6%|████ | 1004/17840 [1:38:39<32:21:49, 6.92s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:45,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:45,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6578, 'learning_rate': 2.999109263657957e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:45,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:45,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:45,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:38:53<31:58:57, 6.84s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:55,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:36:55,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:38:59<31:47:45, 6.80s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:38:59<31:47:45, 6.80s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4283, 'learning_rate': 2.99875296912114e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:04,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:39:06<31:35:57, 6.76s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:39:06<31:35:57, 6.76s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4972, 'learning_rate': 2.998574821852732e-05, 'epoch': 1.13} + 6%|████ | 1008/17840 [1:39:06<31:35:57, 6.76s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:12,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:12,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4326, 'learning_rate': 2.998396674584323e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:12,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:12,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:12,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:39:19<31:12:45, 6.68s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:22,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:22,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:39:26<31:04:23, 6.65s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:39:26<31:04:23, 6.65s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:28,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:28,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:39:32<30:59:19, 6.63s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:39:32<30:59:19, 6.63s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6071, 'learning_rate': 2.9978622327790974e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:36,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:39:39<30:45:06, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:39:39<30:45:06, 6.58s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3439, 'learning_rate': 2.997684085510689e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-15 21:37:43,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:39:45<30:34:32, 6.54s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:39:45<30:34:32, 6.54s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5021, 'learning_rate': 2.9975059382422804e-05, 'epoch': 1.14} + 6%|████▏ | 1014/17840 [1:39:45<30:34:32, 6.54s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:39:45<30:34:32, 6.54s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:39:45<30:34:32, 6.54s/it]g-point operations will not be computed-15 21:34:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:39:52<30:29:16, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:53,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:39:52<30:29:16, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:53,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:39:52<30:29:16, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:53,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:39:58<30:19:34, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:39:58<30:19:34, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4489, 'learning_rate': 2.9971496437054633e-05, 'epoch': 1.14} + 6%|████▏ | 1016/17840 [1:39:58<30:19:34, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1017/17840 [1:40:05<30:06:57, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1017/17840 [1:40:05<30:06:57, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:07,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:07,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1018/17840 [1:40:11<29:56:37, 6.41s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1018/17840 [1:40:11<29:56:37, 6.41s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:13,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:13,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:40:17<29:46:23, 6.37s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:40:17<29:46:23, 6.37s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:20,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:20,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:40:23<29:36:51, 6.34s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:40:23<29:36:51, 6.34s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:26,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:26,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:26,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:40:30<29:23:57, 6.29s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:32,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:32,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:32,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:40:36<29:11:29, 6.25s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:40:42<28:55:10, 6.19s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:44,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:44,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:44,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1024/17840 [1:40:48<28:36:28, 6.12s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:50,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:50,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:40:55<30:08:33, 6.45s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:40:55<30:08:33, 6.45s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.266, 'learning_rate': 2.9955463182897863e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:59,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:38:59,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1026/17840 [1:41:01<29:21:25, 6.29s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:03,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:03,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:03,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1027/17840 [1:41:07<28:35:19, 6.12s/it]g-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:09,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:09,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:09,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:37:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1028/17840 [1:41:12<27:55:00, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1028/17840 [1:41:12<27:55:00, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:17,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:17,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1725, 'learning_rate': 2.9948337292161522e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:21,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:21,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1030/17840 [1:41:23<26:37:39, 5.70s/it]g-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:25,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:25,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:25,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:13,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1031/17840 [1:41:28<25:56:18, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1031/17840 [1:41:28<25:56:18, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:41:33<25:09:58, 5.39s/it]g-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:41:33<25:09:58, 5.39s/it]g-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:35,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:37,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:37,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.382, 'learning_rate': 2.994121140142518e-05, 'epoch': 1.16} +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:41,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:41,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:29,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1034/17840 [1:41:43<23:32:44, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:43,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:45,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:43,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:45,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:43,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1035/17840 [1:41:47<22:29:23, 4.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:49,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:49,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1036/17840 [1:41:51<21:21:13, 4.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:51,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:53,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:51,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:53,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:51,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1037/17840 [1:41:55<20:02:01, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:39:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1038/17840 [1:41:58<18:29:48, 3.96s/it]g-point operations will not be computed-15 21:39:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1038/17840 [1:41:58<18:29:48, 3.96s/it]g-point operations will not be computed-15 21:39:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:59,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:58,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:39:59,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:39:58,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1039/17840 [1:42:01<17:00:55, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:01,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1040/17840 [1:42:04<15:37:16, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:03,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1040/17840 [1:42:04<15:37:16, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:03,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1041/17840 [1:42:06<14:15:37, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:06,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1041/17840 [1:42:06<14:15:37, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:06,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:42:08<12:59:05, 2.78s/it]g-point operations will not be computed-15 21:40:06,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:42:08<12:59:05, 2.78s/it]g-point operations will not be computed-15 21:40:06,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:42:08<12:59:05, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:09,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:42:08<12:59:05, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:09,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:13,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:09,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:13,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:09,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1043/17840 [1:42:16<19:38:46, 4.21s/it]g-point operations will not be computed-15 21:40:09,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1043/17840 [1:42:16<19:38:46, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:17,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1043/17840 [1:42:16<19:38:46, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:17,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:20,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:17,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:20,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:17,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:42:23<23:51:42, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:42:23<23:51:42, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:42:23<23:51:42, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:42:23<23:51:42, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:42:30<26:49:40, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:42:30<26:49:40, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:42:30<26:49:40, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:42:30<26:49:40, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:42:30<26:49:40, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:24,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:42:37<28:51:02, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:42:37<28:51:02, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:42:37<28:51:02, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:42:44<30:05:10, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:42:44<30:05:10, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6957, 'learning_rate': 2.991627078384798e-05, 'epoch': 1.17} + 6%|████▎ | 1047/17840 [1:42:44<30:05:10, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:51,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:51,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5444, 'learning_rate': 2.99144893111639e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:51,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:51,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:40:51,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:42:58<31:30:48, 6.76s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:42:58<31:30:48, 6.76s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:03,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:43:07<33:37:29, 7.21s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:43:07<33:37:29, 7.21s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5081, 'learning_rate': 2.9910926365795728e-05, 'epoch': 1.18} + 6%|████▎ | 1050/17840 [1:43:07<33:37:29, 7.21s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:13,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:13,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4092, 'learning_rate': 2.990914489311164e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:13,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:13,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:13,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:43:21<33:08:48, 7.11s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:23,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:23,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:43:28<32:52:25, 7.05s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:43:28<32:52:25, 7.05s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5077, 'learning_rate': 2.990558194774347e-05, 'epoch': 1.18} + 6%|████▎ | 1053/17840 [1:43:28<32:52:25, 7.05s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:43:28<32:52:25, 7.05s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:43:28<32:52:25, 7.05s/it]g-point operations will not be computed-15 21:40:38,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:43:35<32:31:38, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:43:35<32:31:38, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:43:35<32:31:38, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1055/17840 [1:43:41<32:20:25, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1055/17840 [1:43:41<32:20:25, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4138, 'learning_rate': 2.99020190023753e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-15 21:41:46,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:43:48<32:13:00, 6.91s/it]g-point operations will not be computed-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:43:48<32:13:00, 6.91s/it]g-point operations will not be computed-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3928, 'learning_rate': 2.990023752969121e-05, 'epoch': 1.18} + 6%|████▎ | 1056/17840 [1:43:48<32:13:00, 6.91s/it]g-point operations will not be computed-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:43:48<32:13:00, 6.91s/it]g-point operations will not be computed-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:43:48<32:13:00, 6.91s/it]g-point operations will not be computed-15 21:41:35,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:43:55<31:52:39, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:43:55<31:52:39, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:43:55<31:52:39, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:44:02<31:37:57, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:44:02<31:37:57, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:04,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:04,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1059/17840 [1:44:08<31:24:18, 6.74s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1059/17840 [1:44:08<31:24:18, 6.74s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3725, 'learning_rate': 2.9894893111638958e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:12,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:44:15<31:07:34, 6.68s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:44:15<31:07:34, 6.68s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3836, 'learning_rate': 2.989311163895487e-05, 'epoch': 1.19} + 6%|████▎ | 1060/17840 [1:44:15<31:07:34, 6.68s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:20,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:20,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4124, 'learning_rate': 2.9891330166270787e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:20,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:20,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:44:28<30:54:43, 6.63s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:44:28<30:54:43, 6.63s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:30,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:30,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:44:34<30:44:59, 6.60s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:44:34<30:44:59, 6.60s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.39, 'learning_rate': 2.9887767220902613e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:39,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:44:41<30:37:43, 6.57s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:44:41<30:37:43, 6.57s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4282, 'learning_rate': 2.9885985748218528e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:45,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:44:47<30:30:14, 6.55s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:44:47<30:30:14, 6.55s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4913, 'learning_rate': 2.9884204275534443e-05, 'epoch': 1.19} + 6%|████▎ | 1065/17840 [1:44:47<30:30:14, 6.55s/it]g-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:53,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:53,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4102, 'learning_rate': 2.9882422802850357e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:53,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:59,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:59,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3255, 'learning_rate': 2.9880641330166272e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:59,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:42:59,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:41:56,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:45:06<29:48:12, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:07,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:45:06<29:48:12, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:07,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3288, 'learning_rate': 2.9878859857482187e-05, 'epoch': 1.2} + 6%|████▎ | 1068/17840 [1:45:06<29:48:12, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:07,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:45:06<29:48:12, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:07,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:45:13<29:31:31, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:13,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:45:13<29:31:31, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:13,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:45:13<29:31:31, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:13,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:45:13<29:31:31, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:13,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:45:19<29:19:54, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:45:19<29:19:54, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:24,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:24,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4032, 'learning_rate': 2.9873515439429928e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:24,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:30,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:30,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5003, 'learning_rate': 2.9871733966745846e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:30,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:36,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:36,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3466, 'learning_rate': 2.9869952494061757e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:36,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:42,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:42,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2532, 'learning_rate': 2.9868171021377672e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:47,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:47,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:45:50<29:53:53, 6.42s/it]g-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:52,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:52,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:43:52,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:20,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:45:56<29:06:44, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:45:56<29:06:44, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:01,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:01,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3008, 'learning_rate': 2.9862826603325416e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:01,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:07,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:07,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:09,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:09,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:09,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:46:13<26:56:55, 5.79s/it]g-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:15,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:17,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:17,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3923, 'learning_rate': 2.985748218527316e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:21,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:46:23<25:40:12, 5.51s/it]g-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:46:23<25:40:12, 5.51s/it]g-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:25,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:27,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:27,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4321, 'learning_rate': 2.985391923990499e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:31,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:31,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:43:57,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1083/17840 [1:46:33<23:59:03, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:33,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:36,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:33,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:36,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:33,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1084/17840 [1:46:38<23:07:06, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:38,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:40,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:38,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:40,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:38,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1085/17840 [1:46:42<22:03:03, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:42,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:44,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:42,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:44,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:42,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:46:46<20:53:45, 4.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:46,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:48,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:46,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:48,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:46,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:46:49<19:40:50, 4.23s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:49,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1088/17840 [1:46:53<18:19:08, 3.94s/it]g-point operations will not be computed-15 21:44:49,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1088/17840 [1:46:53<18:19:08, 3.94s/it]g-point operations will not be computed-15 21:44:49,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:54,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:53,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:44:54,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:44:53,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:46:56<17:04:20, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:56,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1090/17840 [1:46:58<15:48:22, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:58,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1090/17840 [1:46:58<15:48:22, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:44:58,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1091/17840 [1:47:01<14:31:39, 3.12s/it]g-point operations will not be computed-15 21:44:58,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1091/17840 [1:47:01<14:31:39, 3.12s/it]g-point operations will not be computed-15 21:44:58,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:47:03<13:19:27, 2.86s/it]g-point operations will not be computed-15 21:45:01,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:47:03<13:19:27, 2.86s/it]g-point operations will not be computed-15 21:45:01,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:47:03<13:19:27, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:45:04,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:47:03<13:19:27, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:45:04,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:45:08,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:04,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:47:11<19:56:32, 4.29s/it]g-point operations will not be computed-15 21:45:04,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:47:11<19:56:32, 4.29s/it]g-point operations will not be computed-15 21:45:04,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:47:11<19:56:32, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:47:11<19:56:32, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:45:15,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:47:18<24:14:52, 5.21s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:47:18<24:14:52, 5.21s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4733, 'learning_rate': 2.983254156769596e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-15 21:45:23,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:47:25<27:00:01, 5.80s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:47:25<27:00:01, 5.80s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6343, 'learning_rate': 2.983076009501188e-05, 'epoch': 1.23} + 6%|████▍ | 1095/17840 [1:47:25<27:00:01, 5.80s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:47:25<27:00:01, 5.80s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:47:32<28:53:10, 6.21s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:47:32<28:53:10, 6.21s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.693, 'learning_rate': 2.982897862232779e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-15 21:45:37,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:47:39<30:07:55, 6.48s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:47:39<30:07:55, 6.48s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6925, 'learning_rate': 2.9827197149643708e-05, 'epoch': 1.23} + 6%|████▍ | 1097/17840 [1:47:39<30:07:55, 6.48s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:47:39<30:07:55, 6.48s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:47:39<30:07:55, 6.48s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1098/17840 [1:47:47<30:55:53, 6.65s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1098/17840 [1:47:47<30:55:53, 6.65s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:45:51,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:47:54<31:30:37, 6.78s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:47:54<31:30:37, 6.78s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6463, 'learning_rate': 2.9823634204275537e-05, 'epoch': 1.23} + 6%|████▍ | 1099/17840 [1:47:54<31:30:37, 6.78s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:47:54<31:30:37, 6.78s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:48:02<33:40:49, 7.24s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:48:02<33:40:49, 7.24s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6959, 'learning_rate': 2.982185273159145e-05, 'epoch': 1.23} + 6%|████▌ | 1100/17840 [1:48:02<33:40:49, 7.24s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:48:02<33:40:49, 7.24s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1101/17840 [1:48:09<33:24:30, 7.19s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1101/17840 [1:48:09<33:24:30, 7.19s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:46:12,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:46:12,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:48:16<33:10:36, 7.14s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:48:16<33:10:36, 7.14s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3267, 'learning_rate': 2.981828978622328e-05, 'epoch': 1.24} + 6%|████▌ | 1102/17840 [1:48:16<33:10:36, 7.14s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:48:16<33:10:36, 7.14s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:48:16<33:10:36, 7.14s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1103/17840 [1:48:23<32:45:35, 7.05s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:46:26,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:46:26,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:48:30<32:28:58, 6.99s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:48:30<32:28:58, 6.99s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4892, 'learning_rate': 2.9814726840855108e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-15 21:46:34,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:48:36<32:12:35, 6.93s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:48:36<32:12:35, 6.93s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4533, 'learning_rate': 2.981294536817102e-05, 'epoch': 1.24} + 6%|████▌ | 1105/17840 [1:48:36<32:12:35, 6.93s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:48:36<32:12:35, 6.93s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:48:36<32:12:35, 6.93s/it]g-point operations will not be computed-15 21:45:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:48:43<32:00:01, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:48:43<32:00:01, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:48:43<32:00:01, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:48:50<31:47:13, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:48:50<31:47:13, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3676, 'learning_rate': 2.980938242280285e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-15 21:46:54,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:48:57<31:29:56, 6.78s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:48:57<31:29:56, 6.78s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2577, 'learning_rate': 2.9807600950118767e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:01,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:49:03<31:25:25, 6.76s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:49:03<31:25:25, 6.76s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3262, 'learning_rate': 2.9805819477434678e-05, 'epoch': 1.24} + 6%|████▌ | 1109/17840 [1:49:03<31:25:25, 6.76s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:09,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:09,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3419, 'learning_rate': 2.9804038004750596e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:09,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:09,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:49:17<31:04:58, 6.69s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:49:17<31:04:58, 6.69s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4674, 'learning_rate': 2.9802256532066508e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:21,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:21,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:49:23<30:53:24, 6.65s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:49:23<30:53:24, 6.65s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:27,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:27,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:49:30<30:40:20, 6.60s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:49:30<30:40:20, 6.60s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:49:30<30:40:20, 6.60s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:49:30<30:40:20, 6.60s/it]g-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:35,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:35,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:35,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:35,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:42,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:42,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:42,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:42,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:47:42,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:46:44,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:49:49<30:10:18, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:50,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:49:49<30:10:18, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:50,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:49:49<30:10:18, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:50,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:49:49<30:10:18, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:50,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:49:55<30:04:30, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:49:55<30:04:30, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:49:55<30:04:30, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:49:55<30:04:30, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:47:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:50:02<29:51:44, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:50:02<29:51:44, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:50:02<29:51:44, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:50:02<29:51:44, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:50:08<29:39:41, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:10,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:10,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:10,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:50:14<29:29:01, 6.35s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:50:14<29:29:01, 6.35s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:18,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:18,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:50:20<29:11:10, 6.28s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:23,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:23,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:23,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1122/17840 [1:50:26<28:50:08, 6.21s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:29,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:29,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:29,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1123/17840 [1:50:32<28:36:33, 6.16s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:35,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:35,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:35,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:50:38<28:25:36, 6.12s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:41,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:41,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:50:46<29:42:17, 6.40s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:50:46<29:42:17, 6.40s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4242, 'learning_rate': 2.977731591448931e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:49,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1126/17840 [1:50:51<28:55:09, 6.23s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1126/17840 [1:50:51<28:55:09, 6.23s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5484, 'learning_rate': 2.9775534441805226e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:55,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:55,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1127/17840 [1:50:57<28:08:03, 6.06s/it]g-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:59,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:59,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:48:59,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:48:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1128/17840 [1:51:03<27:24:04, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:49:03,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1128/17840 [1:51:03<27:24:04, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:49:03,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:07,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:03,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:07,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:03,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5013, 'learning_rate': 2.977019002375297e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:11,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:03,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:11,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:03,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1130/17840 [1:51:13<26:07:56, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:49:14,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1130/17840 [1:51:13<26:07:56, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:49:14,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:18,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:14,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:18,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:14,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3866, 'learning_rate': 2.97666270783848e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:21,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:14,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1132/17840 [1:51:23<24:39:31, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1132/17840 [1:51:23<24:39:31, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:26,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:26,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:51:28<23:38:44, 5.10s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:29,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:31,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:31,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:33,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:35,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:35,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:37,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:37,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:39,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:41,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:41,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:44,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:46,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:46,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:48,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:48,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:50,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:50,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:52,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:52,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:55,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:56,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:56,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1629, 'learning_rate': 2.9748812351543943e-05, 'epoch': 1.28} +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:59,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:59,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:49:59,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:03,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:07,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:07,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:10,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:10,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4718, 'learning_rate': 2.9745249406175773e-05, 'epoch': 1.28} +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:14,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:14,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:14,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:52:18<26:20:17, 5.68s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:21,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:21,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:52:25<28:14:54, 6.09s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:52:25<28:14:54, 6.09s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6693, 'learning_rate': 2.9741686460807603e-05, 'epoch': 1.28} + 6%|████▋ | 1146/17840 [1:52:25<28:14:54, 6.09s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:52:25<28:14:54, 6.09s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:52:25<28:14:54, 6.09s/it]g-point operations will not be computed-15 21:49:24,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:52:32<29:33:22, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:52:32<29:33:22, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:52:32<29:33:22, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:52:39<30:32:58, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:52:39<30:32:58, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5151, 'learning_rate': 2.973812351543943e-05, 'epoch': 1.29} + 6%|████▋ | 1148/17840 [1:52:39<30:32:58, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:45,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:45,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4528, 'learning_rate': 2.9736342042755347e-05, 'epoch': 1.29} +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:45,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:50:45,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:52:54<33:09:04, 7.15s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:52:54<33:09:04, 7.15s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4348, 'learning_rate': 2.9734560570071258e-05, 'epoch': 1.29} + 6%|████▋ | 1150/17840 [1:52:54<33:09:04, 7.15s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:52:54<33:09:04, 7.15s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:53:01<32:52:36, 7.09s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:53:01<32:52:36, 7.09s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:04,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:04,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:04,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:53:08<32:36:58, 7.04s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:53:08<32:36:58, 7.04s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:53:08<32:36:58, 7.04s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:14,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:14,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3996, 'learning_rate': 2.9729216152019006e-05, 'epoch': 1.29} +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:14,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:14,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:14,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:53:22<32:00:41, 6.91s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:25,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:25,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:25,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:53:29<31:58:17, 6.90s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:53:29<31:58:17, 6.90s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:33,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:33,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:53:35<31:40:55, 6.84s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:53:35<31:40:55, 6.84s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:53:35<31:40:55, 6.84s/it]g-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.344, 'learning_rate': 2.9722090261282658e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:50:33,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:53:49<31:16:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:53:49<31:16:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:53:49<31:16:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:53:49<31:16:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:53:55<30:59:53, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:53:55<30:59:53, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:51:59,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:54:02<30:54:22, 6.67s/it]g-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:54:02<30:54:22, 6.67s/it]g-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.316, 'learning_rate': 2.9716745843230406e-05, 'epoch': 1.3} + 7%|████▋ | 1160/17840 [1:54:02<30:54:22, 6.67s/it]g-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:08,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:08,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4866, 'learning_rate': 2.9714964370546317e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:08,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:08,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:08,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:51:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:54:15<30:33:12, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:54:15<30:33:12, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:54:15<30:33:12, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:54:15<30:33:12, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:54:21<30:19:24, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:24,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:24,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:24,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1164/17840 [1:54:28<30:06:28, 6.50s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1165/17840 [1:54:34<29:58:14, 6.47s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1165/17840 [1:54:34<29:58:14, 6.47s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3991, 'learning_rate': 2.9707838479809976e-05, 'epoch': 1.31} + 7%|████▊ | 1165/17840 [1:54:34<29:58:14, 6.47s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:54:41<29:41:39, 6.41s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:54:41<29:41:39, 6.41s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:43,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:43,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:54:47<29:34:14, 6.38s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:54:47<29:34:14, 6.38s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:49,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:49,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:54:53<29:17:47, 6.33s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:54:53<29:17:47, 6.33s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4064, 'learning_rate': 2.970249406175772e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-15 21:52:57,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1169/17840 [1:54:59<29:10:32, 6.30s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1169/17840 [1:54:59<29:10:32, 6.30s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:02,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:02,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:55:05<28:50:26, 6.23s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:55:05<28:50:26, 6.23s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5785, 'learning_rate': 2.969893111638955e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:09,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:55:11<28:39:41, 6.19s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:55:11<28:39:41, 6.19s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4418, 'learning_rate': 2.9697149643705465e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:15,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:55:18<28:29:20, 6.15s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:55:18<28:29:20, 6.15s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:20,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:20,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:55:24<28:16:19, 6.11s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:55:24<28:16:19, 6.11s/it]g-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:26,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:26,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:52:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:55:29<27:58:58, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:55:29<27:58:58, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3615, 'learning_rate': 2.9691805225653205e-05, 'epoch': 1.32} + 7%|████▊ | 1174/17840 [1:55:29<27:58:58, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:55:36<29:15:56, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:55:36<29:15:56, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3968, 'learning_rate': 2.9690023752969124e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:40,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:55:42<28:24:38, 6.14s/it]g-point operations will not be computed-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:55:42<28:24:38, 6.14s/it]g-point operations will not be computed-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:44,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:44,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:44,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:30,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:55:48<27:39:14, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:55:48<27:39:14, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:52,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:52,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2672, 'learning_rate': 2.9684679334916864e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:52,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:58,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:53:58,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:00,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:00,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:53:48,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1180/17840 [1:56:04<25:42:06, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1180/17840 [1:56:04<25:42:06, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2869, 'learning_rate': 2.9681116389548694e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:08,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:08,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:10,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:13,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:13,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4809, 'learning_rate': 2.9677553444180523e-05, 'epoch': 1.33} +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:16,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1183/17840 [1:56:18<23:18:15, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:19,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1183/17840 [1:56:18<23:18:15, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:19,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:21,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:19,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1184/17840 [1:56:23<22:19:07, 4.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:23,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1184/17840 [1:56:23<22:19:07, 4.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:23,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:25,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:23,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1185/17840 [1:56:27<21:13:03, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:27,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1185/17840 [1:56:27<21:13:03, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:27,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:29,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:27,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:29,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:27,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1186/17840 [1:56:30<20:05:12, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:31,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1187/17840 [1:56:34<18:49:19, 4.07s/it]g-point operations will not be computed-15 21:54:31,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1187/17840 [1:56:34<18:49:19, 4.07s/it]g-point operations will not be computed-15 21:54:31,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1187/17840 [1:56:34<18:49:19, 4.07s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:34,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1188/17840 [1:56:37<17:27:15, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:37,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1188/17840 [1:56:37<17:27:15, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:37,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1189/17840 [1:56:40<16:15:20, 3.51s/it]g-point operations will not be computed-15 21:54:37,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1189/17840 [1:56:40<16:15:20, 3.51s/it]g-point operations will not be computed-15 21:54:37,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:41,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:40,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:41,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:40,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:45,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:44,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:45,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:44,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:56:47<12:25:32, 2.69s/it]g-point operations will not be computed-15 21:54:44,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:56:47<12:25:32, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:48,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:56:47<12:25:32, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:48,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:52,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:48,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:52,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:48,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1193/17840 [1:56:54<19:06:08, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:55,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1193/17840 [1:56:54<19:06:08, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:54:55,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:54:59,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:54:55,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:57:02<23:34:32, 5.10s/it]g-point operations will not be computed-15 21:54:55,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:57:02<23:34:32, 5.10s/it]g-point operations will not be computed-15 21:54:55,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:57:02<23:34:32, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:57:02<23:34:32, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:57:02<23:34:32, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1195/17840 [1:57:09<26:42:16, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1195/17840 [1:57:09<26:42:16, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6381, 'learning_rate': 2.9654394299287412e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:14,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [1:57:16<28:39:35, 6.20s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [1:57:16<28:39:35, 6.20s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7028, 'learning_rate': 2.9652612826603327e-05, 'epoch': 1.34} + 7%|████▉ | 1196/17840 [1:57:16<28:39:35, 6.20s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [1:57:16<28:39:35, 6.20s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [1:57:23<30:03:43, 6.50s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [1:57:23<30:03:43, 6.50s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.629, 'learning_rate': 2.965083135391924e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:28,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:57:30<30:47:26, 6.66s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:57:30<30:47:26, 6.66s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4781, 'learning_rate': 2.9649049881235156e-05, 'epoch': 1.34} + 7%|████▉ | 1198/17840 [1:57:30<30:47:26, 6.66s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:57:30<30:47:26, 6.66s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [1:57:37<31:15:48, 6.76s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [1:57:37<31:15:48, 6.76s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:40,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:40,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:40,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:40,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:40,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:48,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:48,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [1:57:53<33:01:02, 7.14s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [1:57:53<33:01:02, 7.14s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4105, 'learning_rate': 2.9643705463182897e-05, 'epoch': 1.35} + 7%|████▉ | 1201/17840 [1:57:53<33:01:02, 7.14s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:59,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:59,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.469, 'learning_rate': 2.9641923990498815e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:59,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:55:59,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:58:06<32:24:15, 7.01s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:58:06<32:24:15, 7.01s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:09,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:09,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:58:13<32:04:00, 6.94s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:58:13<32:04:00, 6.94s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3391, 'learning_rate': 2.9638361045130645e-05, 'epoch': 1.35} + 7%|████▉ | 1204/17840 [1:58:13<32:04:00, 6.94s/it]g-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:19,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:19,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3521, 'learning_rate': 2.9636579572446556e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:19,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:19,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:55:03,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [1:58:27<31:35:19, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [1:58:27<31:35:19, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3176, 'learning_rate': 2.963479809976247e-05, 'epoch': 1.35} + 7%|████▉ | 1206/17840 [1:58:27<31:35:19, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [1:58:33<31:17:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [1:58:33<31:17:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3595, 'learning_rate': 2.9633016627078385e-05, 'epoch': 1.35} + 7%|████▉ | 1207/17840 [1:58:33<31:17:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [1:58:33<31:17:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:39,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:39,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2819, 'learning_rate': 2.9629453681710215e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:56:44,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:27,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:58:53<30:48:49, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:58:53<30:48:49, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:58:53<30:48:49, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:58:53<30:48:49, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:59:00<30:39:52, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:59:00<30:39:52, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:04,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [1:59:06<30:33:38, 6.62s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [1:59:06<30:33:38, 6.62s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4521, 'learning_rate': 2.9624109263657956e-05, 'epoch': 1.36} + 7%|████▉ | 1212/17840 [1:59:06<30:33:38, 6.62s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [1:59:06<30:33:38, 6.62s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:12,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:12,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:12,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:18,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:18,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3495, 'learning_rate': 2.9620546318289785e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:18,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:18,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [1:59:26<30:09:10, 6.53s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [1:59:26<30:09:10, 6.53s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:28,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:28,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1216/17840 [1:59:32<30:00:01, 6.50s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1216/17840 [1:59:32<30:00:01, 6.50s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:35,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:35,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:59:38<29:47:19, 6.45s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:59:38<29:47:19, 6.45s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:41,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:41,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [1:59:45<29:33:10, 6.40s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [1:59:45<29:33:10, 6.40s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:47,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:47,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:47,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:59:51<29:18:37, 6.35s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:59:51<29:18:37, 6.35s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:55,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:57:55,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [1:59:57<29:09:31, 6.32s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [1:59:57<29:09:31, 6.32s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:01,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:01,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [2:00:03<28:54:54, 6.26s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [2:00:03<28:54:54, 6.26s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:07,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:07,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [2:00:09<28:41:43, 6.22s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [2:00:09<28:41:43, 6.22s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:13,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:13,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1223/17840 [2:00:16<28:36:28, 6.20s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1223/17840 [2:00:16<28:36:28, 6.20s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:19,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:19,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [2:00:22<28:27:25, 6.17s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [2:00:22<28:27:25, 6.17s/it]g-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:25,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:25,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:56:54,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:00:29<29:53:49, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:00:29<29:53:49, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:34,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:34,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4846, 'learning_rate': 2.9599168646080762e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:34,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:40,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:40,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4179, 'learning_rate': 2.9597387173396674e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:44,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:44,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [2:00:46<27:32:12, 5.97s/it]g-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [2:00:46<27:32:12, 5.97s/it]g-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:49,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:49,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [2:00:52<26:57:32, 5.84s/it]g-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:54,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:56,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:58:56,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1383, 'learning_rate': 2.9592042755344418e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:00,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [2:01:02<25:46:08, 5.59s/it]g-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [2:01:02<25:46:08, 5.59s/it]g-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:04,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:07,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:07,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4068, 'learning_rate': 2.9588479809976247e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:10,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:10,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:58:30,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1233/17840 [2:01:12<24:11:36, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1233/17840 [2:01:12<24:11:36, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:16,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:16,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:18,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:20,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:20,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:22,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:24,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:24,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:26,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:26,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:28,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:31,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:31,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:33,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:34,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:34,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:37,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:37,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:38,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:38,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:41,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:41,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:41,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:41,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:45,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:49,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:49,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6208, 'learning_rate': 2.9568883610451306e-05, 'epoch': 1.39} +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:53,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:53,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:56,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:56,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3676, 'learning_rate': 2.956710213776722e-05, 'epoch': 1.39} +[WARNING|modeling_utils.py:388] 2022-03-15 21:59:56,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:04,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:04,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5592, 'learning_rate': 2.9565320665083136e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:04,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:04,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:02:12<28:32:38, 6.19s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:02:12<28:32:38, 6.19s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3373, 'learning_rate': 2.956353919239905e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:16,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:02:19<29:39:38, 6.44s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:02:19<29:39:38, 6.44s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4591, 'learning_rate': 2.9561757719714965e-05, 'epoch': 1.4} + 7%|█████ | 1247/17840 [2:02:19<29:39:38, 6.44s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:02:19<29:39:38, 6.44s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:02:26<30:29:05, 6.61s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:02:26<30:29:05, 6.61s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3946, 'learning_rate': 2.955997624703088e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:30,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:02:33<31:03:30, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:02:33<31:03:30, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3837, 'learning_rate': 2.9558194774346795e-05, 'epoch': 1.4} + 7%|█████ | 1249/17840 [2:02:33<31:03:30, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:02:33<31:03:30, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:02:41<33:06:48, 7.19s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:02:41<33:06:48, 7.19s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3922, 'learning_rate': 2.9556413301662706e-05, 'epoch': 1.4} + 7%|█████ | 1250/17840 [2:02:41<33:06:48, 7.19s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:02:41<33:06:48, 7.19s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:02:48<32:45:53, 7.11s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:02:48<32:45:53, 7.11s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:50,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:00:50,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:02:55<32:27:23, 7.04s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:02:55<32:27:23, 7.04s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1098, 'learning_rate': 2.9552850356294536e-05, 'epoch': 1.4} + 7%|█████ | 1252/17840 [2:02:55<32:27:23, 7.04s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:01,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:01,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:01,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0832, 'learning_rate': 2.9551068883610454e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:01,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:03:08<32:09:00, 6.98s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:03:08<32:09:00, 6.98s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:11,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:11,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:11,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:03:15<31:47:36, 6.90s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:03:15<31:47:36, 6.90s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:19,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [2:03:22<31:34:33, 6.85s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [2:03:22<31:34:33, 6.85s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2023, 'learning_rate': 2.9545724465558195e-05, 'epoch': 1.41} + 7%|█████▏ | 1256/17840 [2:03:22<31:34:33, 6.85s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:28,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:28,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:28,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2902, 'learning_rate': 2.954394299287411e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:28,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:03:35<31:11:08, 6.77s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:03:35<31:11:08, 6.77s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3474, 'learning_rate': 2.9542161520190024e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:39,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:39,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:03:42<31:03:25, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:03:42<31:03:25, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:03:42<31:03:25, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:03:42<31:03:25, 6.74s/it]g-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:48,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:48,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:48,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:48,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:01:48,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 21:59:13,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [2:03:55<30:40:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [2:03:55<30:40:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [2:03:55<30:40:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [2:03:55<30:40:45, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:04:02<30:45:37, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:05,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:05,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:05,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:04:09<30:58:10, 6.73s/it]g-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:04:09<30:58:10, 6.73s/it]g-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:04:09<30:58:10, 6.73s/it]g-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:04:09<30:58:10, 6.73s/it]g-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:04:09<30:58:10, 6.73s/it]g-point operations will not be computed-15 22:01:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:04:15<30:58:17, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:04:15<30:58:17, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:04:15<30:58:17, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:04:15<30:58:17, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [2:04:22<30:45:28, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:24,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:24,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:24,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1266/17840 [2:04:28<30:13:17, 6.56s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:31,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:31,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:31,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1267/17840 [2:04:35<29:50:49, 6.48s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:37,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:37,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:37,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:04:41<29:31:15, 6.41s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:43,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:43,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:43,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1269/17840 [2:04:47<29:11:04, 6.34s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:49,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:49,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:49,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1270/17840 [2:04:53<28:56:16, 6.29s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:55,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:55,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:02:55,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:04:59<28:39:48, 6.23s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:02,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:02,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:02,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:05:05<28:26:49, 6.18s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:08,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:08,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:08,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:05:12<28:24:04, 6.17s/it]g-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:14,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:14,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:14,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:02:16,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:05:18<28:12:01, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:05:18<28:12:01, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:05:18<28:12:01, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1275/17840 [2:05:25<29:46:14, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1275/17840 [2:05:25<29:46:14, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2636, 'learning_rate': 2.951187648456057e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:28,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1276/17840 [2:05:31<28:56:35, 6.29s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1276/17840 [2:05:31<28:56:35, 6.29s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2214, 'learning_rate': 2.9510095011876483e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:34,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1277/17840 [2:05:36<28:07:38, 6.11s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1277/17840 [2:05:36<28:07:38, 6.11s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:38,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:38,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:38,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1278/17840 [2:05:42<27:25:32, 5.96s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:44,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:47,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:47,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4157, 'learning_rate': 2.950475059382423e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:51,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1280/17840 [2:05:53<26:13:34, 5.70s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1280/17840 [2:05:53<26:13:34, 5.70s/it]g-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:55,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:55,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:03:55,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:18,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:05:58<25:34:56, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:05:58<25:34:56, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:03:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:02,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:02,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:05,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:05,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:03:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [2:06:08<24:27:37, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [2:06:08<24:27:37, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:11,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1284/17840 [2:06:13<23:35:58, 5.13s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1284/17840 [2:06:13<23:35:58, 5.13s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:14,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:19,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:21,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:21,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:23,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:24,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:24,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:26,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:26,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:29,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:31,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:31,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:34,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:34,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:35,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:37,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:37,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:38,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:38,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0567, 'learning_rate': 2.9481591448931116e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:42,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:46,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:46,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5259, 'learning_rate': 2.947980997624703e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:50,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:50,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5864, 'learning_rate': 2.9478028503562945e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:04:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1295/17840 [2:07:01<26:47:49, 5.83s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1295/17840 [2:07:01<26:47:49, 5.83s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5042, 'learning_rate': 2.947624703087886e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:06,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:07:09<28:43:28, 6.25s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:07:09<28:43:28, 6.25s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4544, 'learning_rate': 2.9474465558194775e-05, 'epoch': 1.45} + 7%|█████▎ | 1296/17840 [2:07:09<28:43:28, 6.25s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:07:09<28:43:28, 6.25s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [2:07:16<29:58:43, 6.52s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [2:07:16<29:58:43, 6.52s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3121, 'learning_rate': 2.947268408551069e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:20,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:20,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:07:23<30:49:52, 6.71s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:07:23<30:49:52, 6.71s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:07:23<30:49:52, 6.71s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:07:23<30:49:52, 6.71s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:07:23<30:49:52, 6.71s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1299/17840 [2:07:30<31:23:02, 6.83s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:33,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:33,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:33,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:07:38<33:21:53, 7.26s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:07:38<33:21:53, 7.26s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:43,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:43,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:07:45<33:05:59, 7.20s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:07:45<33:05:59, 7.20s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:07:45<33:05:59, 7.20s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:07:45<33:05:59, 7.20s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:07:45<33:05:59, 7.20s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1302/17840 [2:07:52<32:47:26, 7.14s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:55,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:55,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:05:55,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:07:59<32:28:04, 7.07s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:07:59<32:28:04, 7.07s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:07:59<32:28:04, 7.07s/it]g-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:05,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:05,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2877, 'learning_rate': 2.9460213776722093e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:05,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:05,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:05,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:04:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:08:13<31:50:33, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:08:20<31:37:11, 6.88s/it]g-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:08:20<31:37:11, 6.88s/it]g-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:08:20<31:37:11, 6.88s/it]g-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:26,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:26,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1489, 'learning_rate': 2.9454869358669834e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:26,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:26,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:26,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:14,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:08:33<31:10:44, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:08:33<31:10:44, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:08:33<31:10:44, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:08:33<31:10:44, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1309/17840 [2:08:40<30:55:37, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1309/17840 [2:08:40<30:55:37, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:44,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:44,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1310/17840 [2:08:46<30:40:54, 6.68s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1310/17840 [2:08:46<30:40:54, 6.68s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1310/17840 [2:08:46<30:40:54, 6.68s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:52,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:52,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2861, 'learning_rate': 2.9447743467933493e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:52,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:58,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:58,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4083, 'learning_rate': 2.9445961995249407e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:58,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:58,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:06:58,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:09:06<30:17:44, 6.60s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:08,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:08,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:08,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:09:12<30:08:04, 6.56s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:15,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:15,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:15,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [2:09:19<29:59:59, 6.54s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [2:09:19<29:59:59, 6.54s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [2:09:19<29:59:59, 6.54s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:24,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:24,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2047, 'learning_rate': 2.9438836104513063e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:24,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:31,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:31,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3066, 'learning_rate': 2.943705463182898e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:35,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:09:38<29:17:31, 6.38s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:09:38<29:17:31, 6.38s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3766, 'learning_rate': 2.9435273159144892e-05, 'epoch': 1.48} + 7%|█████▍ | 1318/17840 [2:09:38<29:17:31, 6.38s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:43,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:43,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3927, 'learning_rate': 2.943349168646081e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:43,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:49,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:49,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4075, 'learning_rate': 2.9431710213776722e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:07:54,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1321/17840 [2:09:56<28:34:52, 6.23s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1321/17840 [2:09:56<28:34:52, 6.23s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2476, 'learning_rate': 2.942992874109264e-05, 'epoch': 1.48} + 7%|█████▍ | 1321/17840 [2:09:56<28:34:52, 6.23s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:01,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:01,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4103, 'learning_rate': 2.942814726840855e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:06,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1323/17840 [2:10:08<28:06:00, 6.12s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1323/17840 [2:10:08<28:06:00, 6.12s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3124, 'learning_rate': 2.9426365795724466e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1324/17840 [2:10:14<27:59:31, 6.10s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1324/17840 [2:10:14<27:59:31, 6.10s/it]g-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2569, 'learning_rate': 2.942458432304038e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:18,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:18,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:06:34,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:10:22<29:27:23, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:10:22<29:27:23, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:27,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:27,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2743, 'learning_rate': 2.942102137767221e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:27,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:32,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:32,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.401, 'learning_rate': 2.9419239904988122e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:37,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [2:10:39<27:24:02, 5.97s/it]g-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [2:10:39<27:24:02, 5.97s/it]g-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:41,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:22,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1329/17840 [2:10:44<26:48:21, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1329/17840 [2:10:44<26:48:21, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5056, 'learning_rate': 2.941567695961995e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:49,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:49,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3042, 'learning_rate': 2.941389548693587e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:53,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:10:55<25:25:45, 5.55s/it]g-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:10:55<25:25:45, 5.55s/it]g-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:57,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:59,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:08:59,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3328, 'learning_rate': 2.94103325415677e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:03,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:03,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:08:45,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1333/17840 [2:11:05<23:47:11, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:05,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:07,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:05,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1334/17840 [2:11:09<22:39:01, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:09,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1334/17840 [2:11:09<22:39:01, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:09,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:11,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:09,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1335/17840 [2:11:13<21:30:05, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:13,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1335/17840 [2:11:13<21:30:05, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:13,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:15,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:13,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1336/17840 [2:11:17<20:18:10, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1336/17840 [2:11:17<20:18:10, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:19,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:19,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1337/17840 [2:11:21<19:08:18, 4.17s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:21,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1338/17840 [2:11:24<17:57:08, 3.92s/it]g-point operations will not be computed-15 22:09:21,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1338/17840 [2:11:24<17:57:08, 3.92s/it]g-point operations will not be computed-15 22:09:21,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:25,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:24,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1339/17840 [2:11:27<16:41:40, 3.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:27,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1339/17840 [2:11:27<16:41:40, 3.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:27,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1340/17840 [2:11:30<15:17:54, 3.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:29,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1340/17840 [2:11:30<15:17:54, 3.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:29,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1341/17840 [2:11:32<14:03:19, 3.07s/it]g-point operations will not be computed-15 22:09:29,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1341/17840 [2:11:32<14:03:19, 3.07s/it]g-point operations will not be computed-15 22:09:29,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:11:34<12:47:08, 2.79s/it]g-point operations will not be computed-15 22:09:32,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:11:34<12:47:08, 2.79s/it]g-point operations will not be computed-15 22:09:32,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:11:34<12:47:08, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:11:34<12:47:08, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:39,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:11:42<19:11:28, 4.19s/it]g-point operations will not be computed-15 22:09:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:11:42<19:11:28, 4.19s/it]g-point operations will not be computed-15 22:09:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:11:42<19:11:28, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:43,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:11:42<19:11:28, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:43,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:46,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:43,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:09:46,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:43,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1344/17840 [2:11:49<23:24:25, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1344/17840 [2:11:49<23:24:25, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1344/17840 [2:11:49<23:24:25, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:11:56<26:14:57, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:11:56<26:14:57, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5274, 'learning_rate': 2.9387173396674584e-05, 'epoch': 1.51} + 8%|█████▌ | 1345/17840 [2:11:56<26:14:57, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:02,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:02,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:02,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3597, 'learning_rate': 2.93853919239905e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:02,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:12:10<29:27:45, 6.43s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:12:10<29:27:45, 6.43s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4135, 'learning_rate': 2.9383610451306413e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:15,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:12:17<30:21:20, 6.63s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:12:17<30:21:20, 6.63s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4635, 'learning_rate': 2.9381828978622328e-05, 'epoch': 1.51} + 8%|█████▌ | 1348/17840 [2:12:17<30:21:20, 6.63s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:12:17<30:21:20, 6.63s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:12:17<30:21:20, 6.63s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:12:24<31:00:33, 6.77s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:12:24<31:00:33, 6.77s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:29,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:29,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:12:33<33:07:16, 7.23s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:12:33<33:07:16, 7.23s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:12:33<33:07:16, 7.23s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:39,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:39,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3821, 'learning_rate': 2.9376484560570072e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:39,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:39,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:39,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:12:47<32:28:53, 7.09s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:10:49,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:12:53<32:08:58, 7.02s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:12:53<32:08:58, 7.02s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:12:53<32:08:58, 7.02s/it]g-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:00,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:00,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3423, 'learning_rate': 2.9371140142517813e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:00,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:00,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:00,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:09:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:13:07<31:44:42, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:13:07<31:44:42, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:13:07<31:44:42, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:13:07<31:44:42, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:13:14<31:27:10, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:13:14<31:27:10, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:13:14<31:27:10, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:20,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:20,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2789, 'learning_rate': 2.936579572446556e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:20,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:20,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:20,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:08,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:13:27<31:04:04, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:13:27<31:04:04, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:13:27<31:04:04, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:13:27<31:04:04, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:13:34<30:49:59, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:36,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:36,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:36,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:13:41<30:38:06, 6.69s/it]g-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:13:41<30:38:06, 6.69s/it]g-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:45,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1361/17840 [2:13:47<30:29:11, 6.66s/it]g-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1361/17840 [2:13:47<30:29:11, 6.66s/it]g-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.972, 'learning_rate': 2.9358669833729217e-05, 'epoch': 1.53} + 8%|█████▌ | 1361/17840 [2:13:47<30:29:11, 6.66s/it]g-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:53,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:53,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4481, 'learning_rate': 2.935688836104513e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:53,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:59,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:59,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2073, 'learning_rate': 2.9355106888361046e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:59,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:59,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:11:59,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:11:28,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:14:07<30:00:39, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:07,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:14:07<30:00:39, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:07,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:14:07<30:00:39, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:07,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:14:07<30:00:39, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:07,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1365/17840 [2:14:13<29:41:33, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1365/17840 [2:14:13<29:41:33, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1365/17840 [2:14:13<29:41:33, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:14:19<29:33:59, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:14:19<29:33:59, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:22,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:22,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:14:26<29:24:10, 6.43s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:14:26<29:24:10, 6.43s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:28,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:28,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:14:32<29:10:43, 6.38s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:14:32<29:10:43, 6.38s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:14:38<28:55:59, 6.32s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:14:38<28:55:59, 6.32s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1370/17840 [2:14:44<28:49:05, 6.30s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1370/17840 [2:14:44<28:49:05, 6.30s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:47,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:47,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1371/17840 [2:14:51<28:37:58, 6.26s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1371/17840 [2:14:51<28:37:58, 6.26s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.349, 'learning_rate': 2.934085510688836e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-15 22:12:54,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1372/17840 [2:14:57<28:19:18, 6.19s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1372/17840 [2:14:57<28:19:18, 6.19s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3165, 'learning_rate': 2.933907363420428e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:00,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1373/17840 [2:15:03<28:08:13, 6.15s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1373/17840 [2:15:03<28:08:13, 6.15s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:05,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:05,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:15:09<27:54:40, 6.10s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:15:09<27:54:40, 6.10s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:11,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:11,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:15:16<29:16:39, 6.40s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:15:16<29:16:39, 6.40s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3413, 'learning_rate': 2.933372921615202e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:19,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1376/17840 [2:15:22<28:23:51, 6.21s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1376/17840 [2:15:22<28:23:51, 6.21s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:24,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:24,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:15:27<27:33:13, 6.03s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:15:27<27:33:13, 6.03s/it]g-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:29,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:29,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:12:14,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:15:33<26:57:33, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:15:33<26:57:33, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2106, 'learning_rate': 2.932838479809976e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:37,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:37,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4286, 'learning_rate': 2.932660332541568e-05, 'epoch': 1.55} +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:37,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:43,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:43,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:46,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:46,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:46,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:33,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1381/17840 [2:15:49<25:28:05, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1381/17840 [2:15:49<25:28:05, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:53,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:53,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:56,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:13:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0846, 'learning_rate': 2.9319477434679338e-05, 'epoch': 1.55} +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:01,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:01,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:13:50,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1384/17840 [2:16:03<22:32:34, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:03,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:05,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:03,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:05,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:03,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1385/17840 [2:16:07<21:30:09, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:07,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:09,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:07,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:09,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:07,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1386/17840 [2:16:11<20:24:30, 4.47s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:11,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1387/17840 [2:16:15<19:12:55, 4.20s/it]g-point operations will not be computed-15 22:14:11,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1387/17840 [2:16:15<19:12:55, 4.20s/it]g-point operations will not be computed-15 22:14:11,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1387/17840 [2:16:15<19:12:55, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:15,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1388/17840 [2:16:18<17:55:02, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:18,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1388/17840 [2:16:18<17:55:02, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:18,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1389/17840 [2:16:21<16:30:29, 3.61s/it]g-point operations will not be computed-15 22:14:18,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1389/17840 [2:16:21<16:30:29, 3.61s/it]g-point operations will not be computed-15 22:14:18,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:22,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:21,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:24,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:23,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:24,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:23,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1391/17840 [2:16:26<13:48:25, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:26,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1391/17840 [2:16:26<13:48:25, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:26,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1392/17840 [2:16:28<12:37:51, 2.76s/it]g-point operations will not be computed-15 22:14:26,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1392/17840 [2:16:28<12:37:51, 2.76s/it]g-point operations will not be computed-15 22:14:26,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1392/17840 [2:16:28<12:37:51, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:29,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1392/17840 [2:16:28<12:37:51, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:29,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:33,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:29,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1393/17840 [2:16:36<19:15:53, 4.22s/it]g-point operations will not be computed-15 22:14:29,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1393/17840 [2:16:36<19:15:53, 4.22s/it]g-point operations will not be computed-15 22:14:29,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1393/17840 [2:16:36<19:15:53, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:37,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:40,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:37,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1394/17840 [2:16:43<23:40:12, 5.18s/it]g-point operations will not be computed-15 22:14:37,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1394/17840 [2:16:43<23:40:12, 5.18s/it]g-point operations will not be computed-15 22:14:37,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1394/17840 [2:16:43<23:40:12, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1394/17840 [2:16:43<23:40:12, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1394/17840 [2:16:43<23:40:12, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:16:50<26:35:31, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:16:50<26:35:31, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4418, 'learning_rate': 2.9298099762470308e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:55,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:14:55,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:16:58<28:28:30, 6.23s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:16:58<28:28:30, 6.23s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:16:58<28:28:30, 6.23s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:16:58<28:28:30, 6.23s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:16:58<28:28:30, 6.23s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:17:05<29:40:31, 6.50s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:17:05<29:40:31, 6.50s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:09,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:09,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:17:12<30:37:50, 6.71s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:17:12<30:37:50, 6.71s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:17:12<30:37:50, 6.71s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:17:12<30:37:50, 6.71s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:17:12<30:37:50, 6.71s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:17:19<31:14:17, 6.84s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:17:19<31:14:17, 6.84s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:24,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:24,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:17:27<33:20:45, 7.30s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:17:27<33:20:45, 7.30s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:17:27<33:20:45, 7.30s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:34,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:34,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3201, 'learning_rate': 2.9287410926365796e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:34,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:34,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:34,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1402/17840 [2:17:41<32:36:22, 7.14s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:44,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:44,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:44,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:17:48<32:16:16, 7.07s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:17:48<32:16:16, 7.07s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:17:48<32:16:16, 7.07s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:54,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:54,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3898, 'learning_rate': 2.928206650831354e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:54,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:54,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:15:54,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:18:02<31:47:42, 6.96s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:18:02<31:47:42, 6.96s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:06,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:06,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:18:09<31:26:38, 6.89s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:18:09<31:26:38, 6.89s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:18:09<31:26:38, 6.89s/it]g-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:15,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:15,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3528, 'learning_rate': 2.927672209026128e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:15,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:15,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:15,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:14:44,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:18:22<31:04:08, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:18:22<31:04:08, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:18:22<31:04:08, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:18:22<31:04:08, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:18:29<30:55:42, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:18:29<30:55:42, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:33,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:33,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:18:36<30:45:51, 6.74s/it]g-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:18:36<30:45:51, 6.74s/it]g-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:18:36<30:45:51, 6.74s/it]g-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3251, 'learning_rate': 2.926959619952494e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:23,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:18:49<30:32:02, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:18:49<30:32:02, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:18:49<30:32:02, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:18:49<30:32:02, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1413/17840 [2:18:55<30:18:51, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:58,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:16:58,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:19:02<30:08:56, 6.61s/it]g-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:19:02<30:08:56, 6.61s/it]g-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2208, 'learning_rate': 2.9264251781472685e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:06,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:19:08<29:57:45, 6.57s/it]g-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:19:08<29:57:45, 6.57s/it]g-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2686, 'learning_rate': 2.92624703087886e-05, 'epoch': 1.59} + 8%|█████▊ | 1415/17840 [2:19:08<29:57:45, 6.57s/it]g-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:14,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:14,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0691, 'learning_rate': 2.926068883610451e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:14,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0945, 'learning_rate': 2.925890736342043e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:17:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:16:50,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:19:27<29:17:38, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:28,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:19:27<29:17:38, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:28,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:19:27<29:17:38, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:28,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:19:27<29:17:38, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:28,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:19:34<29:10:56, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:35,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:19:34<29:10:56, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:35,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:19:34<29:10:56, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:35,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:19:34<29:10:56, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:35,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:19:40<28:55:25, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:41,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:19:40<28:55:25, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:41,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:19:40<28:55:25, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:41,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:19:40<28:55:25, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:41,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:19:46<28:40:59, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:47,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:19:46<28:40:59, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:47,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:19:46<28:40:59, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:47,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:19:46<28:40:59, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:47,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:19:52<28:26:49, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:53,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:19:52<28:26:49, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:53,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:19:52<28:26:49, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:53,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:19:52<28:26:49, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:53,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:19:58<28:14:10, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:59,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:19:58<28:14:10, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:59,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:19:58<28:14:10, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:59,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:19:58<28:14:10, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:17:59,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:20:04<28:04:26, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:20:04<28:04:26, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:20:04<28:04:26, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:20:12<29:37:28, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:20:12<29:37:28, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.098, 'learning_rate': 2.9244655581947747e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:15,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:20:18<28:51:50, 6.33s/it]g-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:20:18<28:51:50, 6.33s/it]g-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0454, 'learning_rate': 2.924287410926366e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:21,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:20:23<28:04:39, 6.16s/it]g-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:20:23<28:04:39, 6.16s/it]g-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:26,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:26,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:26,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:05,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:20:29<27:26:02, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:20:29<27:26:02, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:34,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:34,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0791, 'learning_rate': 2.92375296912114e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:38,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:20:40<26:05:37, 5.72s/it]g-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:20:40<26:05:37, 5.72s/it]g-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:42,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:42,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:42,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1431/17840 [2:20:45<25:34:51, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1431/17840 [2:20:45<25:34:51, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:50,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:50,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:52,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:55,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:55,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3729, 'learning_rate': 2.923040380047506e-05, 'epoch': 1.61} +[WARNING|modeling_utils.py:388] 2022-03-15 22:18:58,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:18:46,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1434/17840 [2:21:00<23:06:33, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1434/17840 [2:21:00<23:06:33, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:02,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:21:04<22:00:48, 4.83s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:21:04<22:00:48, 4.83s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:05,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:07,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:07,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:09,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:11,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:11,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:14,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:14,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:16,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:18,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:18,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:20,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:20,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:22,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:22,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:24,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:24,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.7966, 'learning_rate': 2.921437054631829e-05, 'epoch': 1.62} +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:28,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:28,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3692, 'learning_rate': 2.9212589073634206e-05, 'epoch': 1.62} +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:35,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:35,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:35,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:39,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:43,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:43,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:21:47<26:13:18, 5.76s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:21:47<26:13:18, 5.76s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5859, 'learning_rate': 2.9209026128266035e-05, 'epoch': 1.62} + 8%|█████▉ | 1445/17840 [2:21:47<26:13:18, 5.76s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:53,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:53,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3247, 'learning_rate': 2.9207244655581947e-05, 'epoch': 1.62} +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:53,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:19:53,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:22:01<29:26:40, 6.47s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:22:01<29:26:40, 6.47s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.385, 'learning_rate': 2.920546318289786e-05, 'epoch': 1.62} + 8%|█████▉ | 1447/17840 [2:22:01<29:26:40, 6.47s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:22:01<29:26:40, 6.47s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:22:01<29:26:40, 6.47s/it]g-point operations will not be computed-15 22:19:00,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:22:08<30:18:05, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:22:08<30:18:05, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:22:08<30:18:05, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:22:08<30:18:05, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:22:15<30:48:29, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:22:15<30:48:29, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:22:15<30:48:29, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:22:15<30:48:29, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:22:15<30:48:29, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:22:24<32:49:36, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:22:24<32:49:36, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:22:24<32:49:36, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2429, 'learning_rate': 2.919833729216152e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:22:38<32:24:28, 7.12s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:40,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:40,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:40,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:22:45<32:06:35, 7.05s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:22:45<32:06:35, 7.05s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:22:45<32:06:35, 7.05s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:22:45<32:06:35, 7.05s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:22:45<32:06:35, 7.05s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1454/17840 [2:22:52<31:57:02, 7.02s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:54,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:54,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:20:54,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:22:58<31:38:07, 6.95s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:22:58<31:38:07, 6.95s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:03,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:23:05<31:10:47, 6.85s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:23:05<31:10:47, 6.85s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2399, 'learning_rate': 2.9189429928741094e-05, 'epoch': 1.63} + 8%|█████▉ | 1456/17840 [2:23:05<31:10:47, 6.85s/it]g-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:11,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:11,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2841, 'learning_rate': 2.918764845605701e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:11,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:11,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:11,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:20:09,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:23:18<30:35:25, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:23:18<30:35:25, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:23:18<30:35:25, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:23:18<30:35:25, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:23:25<30:26:58, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:23:25<30:26:58, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:29,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:29,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:23:31<30:11:31, 6.64s/it]g-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:23:31<30:11:31, 6.64s/it]g-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:23:31<30:11:31, 6.64s/it]g-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:37,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:37,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1396, 'learning_rate': 2.9180522565320668e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:37,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:43,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:43,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3341, 'learning_rate': 2.917874109263658e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:43,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1586, 'learning_rate': 2.9176959619952494e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:21:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:21:19,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:23:57<29:28:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:58,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:23:57<29:28:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:58,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:23:57<29:28:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:58,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:23:57<29:28:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:21:58,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:24:04<29:21:55, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:04,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:24:04<29:21:55, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:04,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:24:04<29:21:55, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:04,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:24:04<29:21:55, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:04,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:24:10<29:05:00, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:24:10<29:05:00, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:24:10<29:05:00, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:24:10<29:05:00, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:24:16<28:51:38, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:24:22<28:39:13, 6.30s/it]g-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:24,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:24,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:24,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:24:28<28:28:24, 6.26s/it]g-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:31,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:31,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:31,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:24:35<28:19:26, 6.23s/it]g-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:37,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:37,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:37,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1471/17840 [2:24:41<28:04:22, 6.17s/it]g-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:43,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:43,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:43,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:24:47<27:51:42, 6.13s/it]g-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:49,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:49,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:22:49,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:11,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:24:53<27:42:55, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:53,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:24:53<27:42:55, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:53,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:24:53<27:42:55, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:53,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:24:53<27:42:55, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:53,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:24:58<27:26:29, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:24:58<27:26:29, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:24:58<27:26:29, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:25:06<28:40:34, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:25:06<28:40:34, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0589, 'learning_rate': 2.9155581947743468e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:09,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1476/17840 [2:25:11<28:01:19, 6.16s/it]g-point operations will not be computed-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1476/17840 [2:25:11<28:01:19, 6.16s/it]g-point operations will not be computed-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:13,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:13,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:13,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:22:59,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1477/17840 [2:25:17<27:09:47, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1477/17840 [2:25:17<27:09:47, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:21,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:21,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0869, 'learning_rate': 2.9150237529691212e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:26,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:25:28<25:56:40, 5.71s/it]g-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:25:28<25:56:40, 5.71s/it]g-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:30,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:30,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:30,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:17,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1480/17840 [2:25:33<25:17:31, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:23:33,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1480/17840 [2:25:33<25:17:31, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:23:33,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:37,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:33,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:37,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:33,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0136, 'learning_rate': 2.9144893111638956e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:41,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:33,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:41,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:33,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1482/17840 [2:25:43<24:00:57, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:46,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1483/17840 [2:25:48<23:15:00, 5.12s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1483/17840 [2:25:48<23:15:00, 5.12s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:49,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:51,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:51,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:54,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:56,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:56,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:23:58,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:00,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:00,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:02,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:03,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:03,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:05,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:05,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:08,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:10,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:10,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:12,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:12,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:14,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:14,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:16,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:16,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:17,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:21,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:21,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:24,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:24,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5052, 'learning_rate': 2.912351543942993e-05, 'epoch': 1.67} +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:28,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:28,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:32,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:32,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3481, 'learning_rate': 2.9121733966745845e-05, 'epoch': 1.67} +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:37,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:26:40<26:07:23, 5.75s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:26:40<26:07:23, 5.75s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3631, 'learning_rate': 2.911995249406176e-05, 'epoch': 1.68} + 8%|██████ | 1495/17840 [2:26:40<26:07:23, 5.75s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:26:40<26:07:23, 5.75s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:26:47<27:54:02, 6.15s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:26:47<27:54:02, 6.15s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:50,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:50,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:24:50,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:26:54<29:18:05, 6.45s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:26:54<29:18:05, 6.45s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:26:54<29:18:05, 6.45s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:26:54<29:18:05, 6.45s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:26:54<29:18:05, 6.45s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:27:01<30:09:37, 6.64s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:25:04,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:25:04,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-15 22:25:04,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:27:08<30:48:09, 6.79s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:27:08<30:48:09, 6.79s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:27:08<30:48:09, 6.79s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:27:08<30:48:09, 6.79s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:27:08<30:48:09, 6.79s/it]g-point operations will not be computed-15 22:23:43,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2366] 2022-03-15 22:25:16,174 >> Num examples = 2642 | 1500/17840 [2:27:16<32:50:38, 7.24s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-15 22:25:16,174 >> Num examples = 2642 | 1500/17840 [2:27:16<32:50:38, 7.24s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-15 22:25:16,174 >> Num examples = 2642 | 1500/17840 [2:27:16<32:50:38, 7.24s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|▊ | 3/331 [00:05<09:40, 1.77s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|█ | 4/331 [00:07<10:53, 2.00s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▎ | 5/331 [00:11<13:52, 2.55s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▌ | 6/331 [00:14<15:50, 2.93s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▊ | 7/331 [00:17<15:40, 2.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|██ | 8/331 [00:21<16:33, 3.07s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▎ | 9/331 [00:24<17:42, 3.30s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▍ | 10/331 [00:29<19:51, 3.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▋ | 11/331 [00:32<18:38, 3.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|██▉ | 12/331 [00:35<17:55, 3.37s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▏ | 13/331 [00:38<17:20, 3.27s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▍ | 14/331 [00:41<16:59, 3.22s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▋ | 15/331 [00:46<19:56, 3.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▉ | 16/331 [00:51<22:04, 4.21s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▏ | 17/331 [00:56<22:36, 4.32s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▍ | 18/331 [00:58<19:26, 3.73s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▋ | 19/331 [01:02<19:08, 3.68s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▉ | 20/331 [01:04<16:56, 3.27s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [01:09<18:26, 3.57s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▍ | 22/331 [01:14<20:49, 4.04s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▋ | 23/331 [01:20<23:46, 4.63s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▉ | 24/331 [01:26<26:02, 5.09s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▏ | 25/331 [01:30<24:25, 4.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▍ | 26/331 [01:33<21:39, 4.26s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▋ | 27/331 [01:38<22:02, 4.35s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▉ | 28/331 [01:41<21:00, 4.16s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▏ | 29/331 [01:45<20:08, 4.00s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|█████��█▍ | 30/331 [01:48<18:36, 3.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▋ | 31/331 [01:51<17:19, 3.46s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|███████▉ | 32/331 [01:54<16:43, 3.35s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▏ | 33/331 [01:57<16:49, 3.39s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▍ | 34/331 [02:01<16:55, 3.42s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▋ | 35/331 [02:05<17:21, 3.52s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▉ | 36/331 [02:09<18:58, 3.86s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▏ | 37/331 [02:14<20:43, 4.23s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▍ | 38/331 [02:19<21:16, 4.36s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▋ | 39/331 [02:24<21:28, 4.41s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▉ | 40/331 [02:26<18:27, 3.80s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|██████████▏ | 41/331 [02:29<17:00, 3.52s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▍ | 42/331 [02:34<19:09, 3.98s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▋ | 43/331 [02:39<20:52, 4.35s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▉ | 44/331 [02:44<21:52, 4.57s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▏ | 45/331 [02:48<20:03, 4.21s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▍ | 46/331 [02:50<17:27, 3.67s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▋ | 47/331 [02:52<15:31, 3.28s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [02:56<16:14, 3.44s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▏ | 49/331 [03:01<17:49, 3.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▍ | 50/331 [03:05<17:44, 3.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▋ | 51/331 [03:09<18:31, 3.97s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|████████████▉ | 52/331 [03:12<17:11, 3.70s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▏ | 53/331 [03:16<17:15, 3.73s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▍ | 54/331 [03:19<15:52, 3.44s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▋ | 55/331 [03:24<18:14, 3.97s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▊ | 56/331 [03:27<17:50, 3.89s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|██████████████ | 57/331 [03:31<17:07, 3.75s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▎ | 58/331 [03:36<18:22, 4.04s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▌ | 59/331 [03:38<16:35, 3.66s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▊ | 60/331 [03:41<15:47, 3.50s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|███████████████ | 61/331 [03:46<16:53, 3.75s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▎ | 62/331 [03:49<16:14, 3.62s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▌ | 63/331 [03:55<18:35, 4.16s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▊ | 64/331 [03:58<17:21, 3.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████ | 65/331 [04:01<16:51, 3.80s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▎ | 66/331 [04:08<19:50, 4.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▌ | 67/331 [04:13<21:01, 4.78s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|████████████████▊ | 68/331 [04:18<21:14, 4.85s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████ | 69/331 [04:22<20:33, 4.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▎ | 70/331 [04:27<20:14, 4.65s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▌ | 71/331 [04:32<20:44, 4.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|█████████████████▊ | 72/331 [04:37<20:38, 4.78s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████ | 73/331 [04:41<19:28, 4.53s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████▎ | 74/331 [04:45<19:08, 4.47s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▌ | 75/331 [04:50<19:51, 4.65s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▊ | 76/331 [04:54<18:25, 4.33s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|███████████████████ | 77/331 [04:58<17:43, 4.19s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▎ | 78/331 [05:01<16:14, 3.85s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [05:04<15:21, 3.66s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▊ | 80/331 [05:07<15:13, 3.64s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|████████████████████ | 81/331 [05:12<16:19, 3.92s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▎ | 82/331 [05:16<15:53, 3.83s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▌ | 83/331 [05:20<16:43, 4.05s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [05:26<18:54, 4.59s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████ | 85/331 [05:29<16:44, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▎ | 86/331 [05:34<18:11, 4.45s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▌ | 87/331 [05:38<17:19, 4.26s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|█████████████████████▊ | 88/331 [05:42<16:32, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████ | 89/331 [05:44<14:37, 3.63s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▎ | 90/331 [05:47<13:32, 3.37s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▌ | 91/331 [05:52<14:53, 3.72s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|██████████████████████▊ | 92/331 [05:54<13:13, 3.32s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████ | 93/331 [05:58<13:35, 3.43s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████▎ | 94/331 [06:02<14:06, 3.57s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▌ | 95/331 [06:05<14:19, 3.64s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▊ | 96/331 [06:09<14:30, 3.70s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|████████████████████████ | 97/331 [06:12<13:32, 3.47s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▎ | 98/331 [06:17<14:32, 3.74s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▌ | 99/331 [06:20<14:29, 3.75s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▍ | 100/331 [06:23<13:31, 3.51s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▋ | 101/331 [06:27<13:26, 3.51s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▉ | 102/331 [06:32<15:16, 4.00s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▏ | 103/331 [06:35<14:05, 3.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▍ | 104/331 [06:39<13:55, 3.68s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▋ | 105/331 [06:42<13:57, 3.70s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▉ | 106/331 [06:46<13:56, 3.72s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|██████████████████████████▏ | 107/331 [06:48<12:18, 3.30s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▍ | 108/331 [06:51<11:52, 3.20s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▋ | 109/331 [06:54<11:45, 3.18s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▉ | 110/331 [06:59<13:06, 3.56s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▏ | 111/331 [07:03<13:18, 3.63s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▍ | 112/331 [07:06<13:24, 3.67s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▋ | 113/331 [07:09<12:19, 3.39s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▉ | 114/331 [07:13<12:36, 3.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▏ | 115/331 [07:17<12:45, 3.54s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▍ | 116/331 [07:21<13:28, 3.76s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▋ | 117/331 [07:25<13:25, 3.76s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|████████████████████████████▉ | 118/331 [07:28<12:40, 3.57s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████ | 119/331 [07:31<12:38, 3.58s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████▎ | 120/331 [07:35<12:42, 3.61s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▌ | 121/331 [07:40<13:53, 3.97s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▊ | 122/331 [07:43<13:21, 3.83s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████ | 123/331 [07:49<14:43, 4.25s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████▎ | 124/331 [07:52<14:18, 4.15s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▌ | 125/331 [07:58<15:27, 4.50s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▊ | 126/331 [08:03<15:40, 4.59s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|███████████████████████████████ | 127/331 [08:08<16:26, 4.84s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▎ | 128/331 [08:13<16:35, 4.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▌ | 129/331 [08:18<16:07, 4.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▊ | 130/331 [08:23<16:24, 4.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████ | 131/331 [08:28<16:45, 5.03s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▎ | 132/331 [08:32<15:27, 4.66s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▌ | 133/331 [08:35<13:52, 4.20s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▊ | 134/331 [08:39<13:15, 4.04s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████ | 135/331 [08:43<13:40, 4.18s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▎ | 136/331 [08:48<14:25, 4.44s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▌ | 137/331 [08:53<15:05, 4.67s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|█████████████████████████████████▊ | 138/331 [08:59<15:32, 4.83s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [09:01<13:02, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [09:01<13:02, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [09:01<13:02, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▌ | 141/331 [09:10<13:37, 4.30s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▋ | 142/331 [09:14<12:49, 4.07s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▉ | 143/331 [09:19<13:46, 4.39s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▏ | 144/331 [09:23<13:02, 4.19s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▍ | 145/331 [09:27<12:43, 4.11s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|████████████████████��██████████████▋ | 146/331 [09:32<13:44, 4.46s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▉ | 147/331 [09:36<13:02, 4.25s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▏ | 148/331 [09:39<11:44, 3.85s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▍ | 149/331 [09:41<10:43, 3.54s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▋ | 150/331 [09:46<11:37, 3.85s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|████████████████████████████████████▉ | 151/331 [09:50<11:23, 3.80s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▏ | 152/331 [09:53<10:28, 3.51s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▍ | 153/331 [09:56<10:05, 3.40s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▋ | 154/331 [10:00<11:08, 3.78s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▉ | 155/331 [10:05<12:12, 4.16s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████��███████████████▏ | 156/331 [10:10<12:52, 4.41s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▍ | 157/331 [10:16<13:31, 4.67s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▋ | 158/331 [10:21<13:47, 4.78s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [10:26<13:49, 4.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [10:26<13:49, 4.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [10:26<13:49, 4.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▍ | 161/331 [10:33<12:01, 4.24s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▋ | 162/331 [10:38<12:49, 4.55s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [10:43<13:01, 4.65s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▏ | 164/331 [10:47<12:10, 4.37s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|█████████���██████████████████████████████▍ | 165/331 [10:51<11:42, 4.23s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▌ | 166/331 [10:55<11:14, 4.09s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▊ | 167/331 [10:59<11:42, 4.28s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████ | 168/331 [11:02<10:39, 3.92s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▎ | 169/331 [11:07<11:01, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▌ | 170/331 [11:10<10:06, 3.77s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|█████████████████████████████████████████▊ | 171/331 [11:14<10:01, 3.76s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████ | 172/331 [11:16<08:40, 3.27s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████▎ | 173/331 [11:20<09:21, 3.56s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▌ | 174/331 [11:23<08:50, 3.38s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▊ | 175/331 [11:27<09:09, 3.52s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████ | 176/331 [11:30<08:42, 3.37s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████▎ | 177/331 [11:34<09:39, 3.76s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▌ | 178/331 [11:40<10:42, 4.20s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▊ | 179/331 [11:45<11:28, 4.53s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|████████████████████████████████████████████ | 180/331 [11:49<11:17, 4.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▎ | 181/331 [11:54<11:09, 4.46s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▌ | 182/331 [11:57<09:49, 3.96s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▊ | 183/331 [11:59<08:37, 3.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████ | 184/331 [12:01<07:43, 3.15s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▎ | 185/331 [12:03<06:54, 2.84s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▌ | 186/331 [12:07<07:27, 3.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▊ | 187/331 [12:12<08:46, 3.66s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████ | 188/331 [12:16<08:43, 3.66s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▎ | 189/331 [12:18<07:59, 3.38s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▍ | 190/331 [12:21<07:29, 3.18s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▋ | 191/331 [12:24<07:18, 3.13s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▉ | 192/331 [12:27<06:57, 3.00s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|███████████████████████████████████████████████▏ | 193/331 [12:32<08:01, 3.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▍ | 194/331 [12:34<07:14, 3.17s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▋ | 195/331 [12:37<06:58, 3.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▉ | 196/331 [12:40<07:14, 3.22s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▏ | 197/331 [12:45<07:56, 3.56s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▍ | 198/331 [12:47<07:17, 3.29s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▋ | 199/331 [12:51<07:30, 3.41s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▉ | 200/331 [12:53<06:46, 3.10s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▏ | 201/331 [12:56<06:37, 3.06s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▍ | 202/331 [13:00<07:00, 3.26s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▋ | 203/331 [13:04<07:09, 3.35s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|█████████████████████████████████████████████████▉ | 204/331 [13:08<07:55, 3.75s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▏ | 205/331 [13:13<08:09, 3.89s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▍ | 206/331 [13:16<07:59, 3.84s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▋ | 207/331 [13:21<08:39, 4.19s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▉ | 208/331 [13:26<08:52, 4.33s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▏ | 209/331 [13:28<07:37, 3.75s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▍ | 210/331 [13:31<06:43, 3.34s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▋ | 211/331 [13:34<06:54, 3.46s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▉ | 212/331 [13:37<06:24, 3.23s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|████████████████████████████████████████████████████ | 213/331 [13:41<06:30, 3.31s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▎ | 214/331 [13:43<05:53, 3.02s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▌ | 215/331 [13:45<05:24, 2.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▊ | 216/331 [13:50<06:37, 3.46s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████ | 217/331 [13:54<06:35, 3.47s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▎ | 218/331 [13:58<07:11, 3.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▌ | 219/331 [14:02<07:02, 3.77s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▊ | 220/331 [14:05<06:31, 3.52s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████ | 221/331 [14:09<06:37, 3.61s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▎ | 222/331 [14:12<06:07, 3.37s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▌ | 223/331 [14:15<06:15, 3.48s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|██████████████████████████████████████████████████████▊ | 224/331 [14:19<06:20, 3.56s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████ | 225/331 [14:23<06:21, 3.60s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████▎ | 226/331 [14:28<06:59, 4.00s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▌ | 227/331 [14:31<06:45, 3.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▊ | 228/331 [14:35<06:27, 3.76s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████ | 229/331 [14:38<06:18, 3.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████▎ | 230/331 [14:42<05:56, 3.53s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▌ | 231/331 [14:46<06:16, 3.77s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████���███████████████████████████████████████▊ | 232/331 [14:49<06:06, 3.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|█████████████████████████████████████████████████████████ | 233/331 [14:54<06:25, 3.93s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [14:57<05:51, 3.62s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [15:00<05:28, 3.42s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▊ | 236/331 [15:06<06:34, 4.16s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|█████████████████████████████████████████████████████████▉ | 237/331 [15:11<07:00, 4.47s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [15:15<06:53, 4.45s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [15:20<06:52, 4.48s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [15:25<07:03, 4.66s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [15:30<07:13, 4.81s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [15:35<07:14, 4.88s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [15:40<07:10, 4.89s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [15:45<07:16, 5.02s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [15:50<06:55, 4.83s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [15:56<07:22, 5.20s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [16:00<06:58, 4.98s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [16:04<06:17, 4.55s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▉ | 249/331 [16:07<05:30, 4.03s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [16:10<05:01, 3.72s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [16:14<05:11, 3.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [16:17<04:44, 3.60s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [16:22<05:08, 3.95s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [16:25<04:54, 3.83s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [16:30<05:11, 4.09s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [16:33<04:54, 3.93s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [16:38<05:05, 4.13s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [16:41<04:33, 3.74s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [16:44<04:25, 3.69s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▋ | 260/331 [16:49<04:34, 3.87s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [16:51<04:00, 3.44s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████ | 262/331 [16:55<04:01, 3.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [16:59<04:22, 3.87s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▌ | 264/331 [17:03<04:03, 3.64s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [17:06<03:50, 3.49s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|█████████████████████████████████████████████████████████████████ | 266/331 [17:09<03:38, 3.36s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▎ | 267/331 [17:14<04:02, 3.79s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [17:17<03:56, 3.76s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [17:22<04:18, 4.16s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [17:26<04:09, 4.08s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [17:31<04:22, 4.38s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [17:35<04:03, 4.12s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [17:39<03:59, 4.13s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████ | 274/331 [17:44<04:13, 4.45s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [17:49<04:13, 4.54s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [17:52<03:46, 4.12s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|███████████████████████████████████████████████████████████████████▊ | 277/331 [17:56<03:35, 4.00s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [18:00<03:28, 3.93s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [18:05<03:55, 4.53s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [18:09<03:42, 4.36s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [18:15<03:49, 4.58s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [18:19<03:43, 4.57s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [18:24<03:47, 4.75s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [18:30<03:50, 4.90s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [18:35<03:49, 4.99s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [18:40<03:47, 5.05s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▏ | 287/331 [18:46<03:54, 5.32s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [18:51<03:47, 5.28s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [18:55<03:22, 4.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|██████████████████████████████████████████████████████████████████████▉ | 290/331 [18:58<03:02, 4.44s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [19:01<02:41, 4.03s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▍ | 292/331 [19:05<02:31, 3.88s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [19:09<02:26, 3.85s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [19:12<02:11, 3.56s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████���████▏ | 295/331 [19:15<02:02, 3.40s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [19:17<01:51, 3.18s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▋ | 297/331 [19:23<02:09, 3.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▉ | 298/331 [19:28<02:21, 4.29s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [19:32<02:10, 4.09s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▍ | 300/331 [19:36<02:05, 4.04s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [19:39<01:58, 3.95s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▉ | 302/331 [19:43<01:50, 3.82s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [19:46<01:40, 3.58s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [19:50<01:43, 3.83s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [19:55<01:46, 4.11s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▉ | 306/331 [20:00<01:51, 4.47s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [20:06<01:53, 4.73s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [20:11<01:55, 5.03s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [20:17<01:52, 5.13s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [20:20<01:35, 4.56s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████ | 311/331 [20:25<01:32, 4.60s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [20:28<01:18, 4.16s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [20:32<01:12, 4.03s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▊ | 314/331 [20:36<01:11, 4.21s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [20:41<01:10, 4.41s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [20:46<01:06, 4.46s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▌ | 317/331 [20:51<01:06, 4.72s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▊ | 318/331 [20:54<00:55, 4.26s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [20:57<00:47, 3.94s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [21:02<00:44, 4.06s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [21:05<00:39, 3.98s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [21:11<00:39, 4.34s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████ | 323/331 [21:14<00:33, 4.15s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [21:19<00:31, 4.44s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▌ | 325/331 [21:24<00:27, 4.50s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▊ | 326/331 [21:29<00:22, 4.59s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [21:34<00:18, 4.59s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▎| 328/331 [21:38<00:14, 4.71s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [21:43<00:09, 4.57s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [21:48<00:04, 4.84s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [21:48<00:04, 4.84s/it][INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/15/2022 22:47:10 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|configuration_utils.py:438] 2022-03-15 22:47:10,335 >> Configuration saved in ./checkpoint-1500/config.json [INFO|trainer.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-15 22:47:15,091 >> Configuration saved in ./checkpoint-1500/preprocessor_config.jsoner.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-15 22:47:15,091 >> Configuration saved in ./checkpoint-1500/preprocessor_config.jsoner.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-15 22:47:15,091 >> Configuration saved in ./checkpoint-1500/preprocessor_config.jsoner.py:560] 2022-03-15 22:25:16,172 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/15/2022 22:47:33 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220315_195757-3ex43zbl/run-3ex43zbl.wandb']. This may take a bit of time if the files are large.