diff --git "a/wandb/run-20220302_114207-c11kvzxa/files/output.log" "b/wandb/run-20220302_114207-c11kvzxa/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_114207-c11kvzxa/files/output.log" @@ -0,0 +1,2292 @@ + + + 0%| | 0/892 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:12,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:14,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:16,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 1/892 [00:08<1:59:05, 8.02s/it] + 0%| | 1/892 [00:08<1:59:05, 8.02s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:42:18,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:20,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:21,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0803, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:23,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▏ | 2/892 [00:15<1:53:53, 7.68s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:42:25,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:27,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:29,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9484, 'learning_rate': 6e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:31,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▎ | 3/892 [00:22<1:51:42, 7.54s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:42:33,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:34,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:36,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.938, 'learning_rate': 1.2e-06, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:38,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▎ | 4/892 [00:29<1:48:57, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:42:40,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:41,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:43,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7551, 'learning_rate': 1.8e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:45,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▍ | 5/892 [00:37<1:47:24, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:42:47,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:49,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:50,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8735, 'learning_rate': 2.4e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:52,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▌ | 6/892 [00:44<1:46:56, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:42:54,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:56,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:57,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8362, 'learning_rate': 2.9999999999999997e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:42:59,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 7/892 [00:51<1:45:47, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:01,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:03,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:04,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7153, 'learning_rate': 3.6e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▋ | 8/892 [00:58<1:45:00, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:08,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:10,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:11,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.845, 'learning_rate': 4.2e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:13,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 9/892 [01:05<1:44:21, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:15,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:17,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:18,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6926, 'learning_rate': 4.8e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:20,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▉ | 10/892 [01:12<1:43:50, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:22,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:24,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:25,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:27,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 11/892 [01:19<1:42:46, 7.00s/it] + + 1%|▉ | 11/892 [01:19<1:42:46, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:29,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:31,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:32,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6924, 'learning_rate': 5.999999999999999e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:34,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 12/892 [01:26<1:42:12, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:36,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:37,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:39,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:41,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 13/892 [01:32<1:41:39, 6.94s/it] + + 1%|█▏ | 13/892 [01:32<1:41:39, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:43,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:44,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:46,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:48,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 14/892 [01:39<1:41:19, 6.92s/it] + + 2%|█▎ | 14/892 [01:39<1:41:19, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:50,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:51,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:53,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4967, 'learning_rate': 7.799999999999998e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:55,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 2%|█▎ | 15/892 [01:46<1:40:59, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:43:56,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:43:58,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:00,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:01,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 16/892 [01:53<1:40:09, 6.86s/it] + + 2%|█▍ | 16/892 [01:53<1:40:09, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:03,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:05,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:06,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:08,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 17/892 [02:00<1:39:12, 6.80s/it] + + 2%|█▌ | 17/892 [02:00<1:39:12, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:10,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:11,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:13,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:15,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 18/892 [02:06<1:38:19, 6.75s/it] + + 2%|█▌ | 18/892 [02:06<1:38:19, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:16,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:18,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:20,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3842, 'learning_rate': 1.02e-05, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:21,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 19/892 [02:13<1:37:51, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:23,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:25,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:26,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:28,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 20/892 [02:20<1:37:23, 6.70s/it] + 2%|█▊ | 20/892 [02:20<1:37:23, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:30,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:31,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:33,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:34,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 21/892 [02:26<1:36:01, 6.62s/it] + + 2%|█▉ | 21/892 [02:26<1:36:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:36,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:38,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:39,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:41,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 22/892 [02:32<1:35:08, 6.56s/it] + + 2%|█▉ | 22/892 [02:32<1:35:08, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:42,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:44,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:46,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:47,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 23/892 [02:39<1:34:11, 6.50s/it] + + 3%|██ | 23/892 [02:39<1:34:11, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:49,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:50,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:52,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:54,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5379, 'learning_rate': 1.3199999999999997e-05, 'epoch': 0.03} + 3%|██▏ | 24/892 [02:45<1:33:40, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:44:55,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:57,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:44:58,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4186, 'learning_rate': 1.3799999999999998e-05, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:00,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:04,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:02,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:04,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:02,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:05,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:07,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 26/892 [02:58<1:33:48, 6.50s/it] + 3%|██▎ | 26/892 [02:58<1:33:48, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:08,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:10,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:11,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:08,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:04<1:32:22, 6.41s/it]g-point operations will not be computed-02 11:45:08,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:04<1:32:22, 6.41s/it]g-point operations will not be computed-02 11:45:08,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:04<1:32:22, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:17,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:11<1:31:04, 6.32s/it]g-point operations will not be computed-02 11:45:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:11<1:31:04, 6.32s/it]g-point operations will not be computed-02 11:45:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:11<1:31:04, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:21,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:24,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:21,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:17<1:30:15, 6.28s/it]g-point operations will not be computed-02 11:45:21,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:17<1:30:15, 6.28s/it]g-point operations will not be computed-02 11:45:21,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:17<1:30:15, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:27,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:30,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:27,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:23<1:29:29, 6.23s/it]g-point operations will not be computed-02 11:45:27,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:23<1:29:29, 6.23s/it]g-point operations will not be computed-02 11:45:27,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:23<1:29:29, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:33,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:36,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:33,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:29<1:28:34, 6.17s/it]g-point operations will not be computed-02 11:45:33,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:29<1:28:34, 6.17s/it]g-point operations will not be computed-02 11:45:33,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:29<1:28:34, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:39,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:42,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:39,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:35<1:27:17, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:45,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:35<1:27:17, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:45,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2016, 'learning_rate': 1.7999999999999997e-05, 'epoch': 0.04} + 4%|██▉ | 33/892 [03:41<1:26:03, 6.01s/it]g-point operations will not be computed-02 11:45:45,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:41<1:26:03, 6.01s/it]g-point operations will not be computed-02 11:45:45,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:41<1:26:03, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:50,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:53,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:50,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:46<1:24:20, 5.90s/it]g-point operations will not be computed-02 11:45:50,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:46<1:24:20, 5.90s/it]g-point operations will not be computed-02 11:45:50,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:46<1:24:20, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:45:56,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:45:59,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:45:56,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:52<1:22:33, 5.78s/it]g-point operations will not be computed-02 11:45:56,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:52<1:22:33, 5.78s/it]g-point operations will not be computed-02 11:45:56,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:52<1:22:33, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:02,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:04,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:02,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:04,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:02,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [03:57<1:20:59, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [03:57<1:20:59, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [04:03<1:19:30, 5.58s/it]g-point operations will not be computed-02 11:46:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [04:03<1:19:30, 5.58s/it]g-point operations will not be computed-02 11:46:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [04:03<1:19:30, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:12,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:15,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:12,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:08<1:17:58, 5.48s/it]g-point operations will not be computed-02 11:46:12,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:08<1:17:58, 5.48s/it]g-point operations will not be computed-02 11:46:12,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:08<1:17:58, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:18,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:20,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:18,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:20,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:18,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:13<1:16:31, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:23,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:25,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:23,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:18<1:14:34, 5.25s/it]g-point operations will not be computed-02 11:46:23,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:18<1:14:34, 5.25s/it]g-point operations will not be computed-02 11:46:23,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:18<1:14:34, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:28,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:23<1:12:44, 5.13s/it]g-point operations will not be computed-02 11:46:28,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:23<1:12:44, 5.13s/it]g-point operations will not be computed-02 11:46:28,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:23<1:12:44, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:32,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:35,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:32,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:27<1:10:15, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:37,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:27<1:10:15, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:37,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:39,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:37,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:39,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:37,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 43/892 [04:32<1:07:32, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:41,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:43,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:41,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:43,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:41,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 44/892 [04:36<1:03:52, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:45,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 45/892 [04:39<59:21, 4.20s/it]g-point operations will not be computed-02 11:46:45,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 45/892 [04:39<59:21, 4.20s/it]g-point operations will not be computed-02 11:46:45,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:50,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:48,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 46/892 [04:42<54:35, 3.87s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:51,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 46/892 [04:42<54:35, 3.87s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:46:51,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▎ | 47/892 [04:45<50:02, 3.55s/it]g-point operations will not be computed-02 11:46:51,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▎ | 47/892 [04:45<50:02, 3.55s/it]g-point operations will not be computed-02 11:46:51,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 48/892 [04:47<45:33, 3.24s/it]g-point operations will not be computed-02 11:46:54,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 48/892 [04:47<45:33, 3.24s/it]g-point operations will not be computed-02 11:46:54,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:58,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:56,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:46:58,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:56,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:00,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:46:59,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:52<40:11, 2.86s/it]g-point operations will not be computed-02 11:46:59,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:52<40:11, 2.86s/it]g-point operations will not be computed-02 11:46:59,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:52<40:11, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:03,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:52<40:11, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:03,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:06,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:03,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:06,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:03,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 51/892 [05:00<59:35, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:10,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 51/892 [05:00<59:35, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:10,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:14,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:10,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:14,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:10,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:07<1:11:56, 5.14s/it]g-point operations will not be computed-02 11:47:10,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:07<1:11:56, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:07<1:11:56, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:21,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:21,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:14<1:20:34, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:25,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:14<1:20:34, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:25,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:28,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:25,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:28,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:25,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:21<1:25:46, 6.14s/it]g-point operations will not be computed-02 11:47:25,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:21<1:25:46, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:32,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:21<1:25:46, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:32,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:28<1:29:20, 6.40s/it]g-point operations will not be computed-02 11:47:32,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:28<1:29:20, 6.40s/it]g-point operations will not be computed-02 11:47:32,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:28<1:29:20, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:39,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:28<1:29:20, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:39,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:42,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:39,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:42,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:39,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:36<1:32:17, 6.62s/it]g-point operations will not be computed-02 11:47:39,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:36<1:32:17, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:46,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:36<1:32:17, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:46,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:36<1:32:17, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:46,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:43<1:33:53, 6.75s/it]g-point operations will not be computed-02 11:47:46,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:43<1:33:53, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:53,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:43<1:33:53, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:47:53,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:56,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:53,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:47:56,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:47:53,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:49<1:34:36, 6.81s/it]g-point operations will not be computed-02 11:47:53,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:49<1:34:36, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:00,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:03,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:00,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:03,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:00,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [05:56<1:34:36, 6.81s/it]g-point operations will not be computed-02 11:48:00,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [05:56<1:34:36, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:07,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [05:56<1:34:36, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:07,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [06:03<1:34:48, 6.84s/it]g-point operations will not be computed-02 11:48:07,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [06:03<1:34:48, 6.84s/it]g-point operations will not be computed-02 11:48:07,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [06:03<1:34:48, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [06:03<1:34:48, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:17,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:17,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:10<1:34:40, 6.84s/it]g-point operations will not be computed-02 11:48:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:10<1:34:40, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:20,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:23,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:20,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:23,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:20,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:17<1:34:08, 6.81s/it]g-point operations will not be computed-02 11:48:20,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:17<1:34:08, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:27,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:30,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:27,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:23<1:33:36, 6.77s/it]g-point operations will not be computed-02 11:48:27,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:23<1:33:36, 6.77s/it]g-point operations will not be computed-02 11:48:27,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:23<1:33:36, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:34,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:23<1:33:36, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:34,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:37,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:34,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:37,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:34,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:30<1:33:09, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:40,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:30<1:33:09, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:40,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:44,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:40,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:44,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:40,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▊ | 65/892 [06:37<1:32:52, 6.74s/it]g-point operations will not be computed-02 11:48:40,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▊ | 65/892 [06:37<1:32:52, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:47,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:50,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:47,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:50,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:47,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:44<1:32:17, 6.70s/it]g-point operations will not be computed-02 11:48:47,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:44<1:32:17, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:48:54,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:48:57,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:48:54,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-02 11:48:54,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-02 11:48:54,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:50<1:31:47, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:00,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:50<1:31:47, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:00,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:03,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:00,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:03,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:00,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [06:57<1:30:45, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:07,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [06:57<1:30:45, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:07,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:10,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:07,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:10,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:07,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [07:03<1:29:52, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:13,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [07:03<1:29:52, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:13,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:16,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:13,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:16,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:13,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:09<1:29:17, 6.52s/it]g-point operations will not be computed-02 11:49:13,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:09<1:29:17, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:19,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:23,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:19,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:23,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:19,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 71/892 [07:16<1:28:42, 6.48s/it]g-point operations will not be computed-02 11:49:19,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 71/892 [07:16<1:28:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:26,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:26,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:29,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:26,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 72/892 [07:22<1:28:07, 6.45s/it]g-point operations will not be computed-02 11:49:26,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 72/892 [07:22<1:28:07, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:32,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:35,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:32,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:28<1:27:07, 6.38s/it]g-point operations will not be computed-02 11:49:32,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:28<1:27:07, 6.38s/it]g-point operations will not be computed-02 11:49:32,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:28<1:27:07, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:42,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:35<1:26:39, 6.36s/it]g-point operations will not be computed-02 11:49:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:35<1:26:39, 6.36s/it]g-point operations will not be computed-02 11:49:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:35<1:26:39, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:45,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:48,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:45,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:42<1:28:14, 6.48s/it]g-point operations will not be computed-02 11:49:45,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:42<1:28:14, 6.48s/it]g-point operations will not be computed-02 11:49:45,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:42<1:28:14, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:52,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:49:55,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:52,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:48<1:27:02, 6.40s/it]g-point operations will not be computed-02 11:49:52,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:48<1:27:02, 6.40s/it]g-point operations will not be computed-02 11:49:52,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:48<1:27:02, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:49:58,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:01,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:49:58,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [07:54<1:26:07, 6.34s/it]g-point operations will not be computed-02 11:49:58,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [07:54<1:26:07, 6.34s/it]g-point operations will not be computed-02 11:49:58,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [07:54<1:26:07, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:04,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:07,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:04,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [08:00<1:25:00, 6.27s/it]g-point operations will not be computed-02 11:50:04,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [08:00<1:25:00, 6.27s/it]g-point operations will not be computed-02 11:50:04,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [08:00<1:25:00, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:10,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [08:00<1:25:00, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:10,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [08:06<1:23:54, 6.19s/it]g-point operations will not be computed-02 11:50:10,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [08:06<1:23:54, 6.19s/it]g-point operations will not be computed-02 11:50:10,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [08:06<1:23:54, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:16,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:19,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:16,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:12<1:22:56, 6.13s/it]g-point operations will not be computed-02 11:50:16,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:12<1:22:56, 6.13s/it]g-point operations will not be computed-02 11:50:16,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:12<1:22:56, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:22,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:25,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:22,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:18<1:22:03, 6.07s/it]g-point operations will not be computed-02 11:50:22,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:18<1:22:03, 6.07s/it]g-point operations will not be computed-02 11:50:22,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:18<1:22:03, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:28,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:31,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:28,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:31,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:28,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 82/892 [08:24<1:21:03, 6.00s/it]g-point operations will not be computed-02 11:50:28,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 82/892 [08:24<1:21:03, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:34,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:37,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:34,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:37,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:34,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:30<1:20:05, 5.94s/it]g-point operations will not be computed-02 11:50:34,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:30<1:20:05, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:39,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:42,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:39,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:42,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:39,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▌ | 84/892 [08:35<1:18:32, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▌ | 84/892 [08:35<1:18:32, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▌ | 84/892 [08:35<1:18:32, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 85/892 [08:41<1:17:06, 5.73s/it]g-point operations will not be computed-02 11:50:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 85/892 [08:41<1:17:06, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:50:50,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:53,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:50,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:53,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:50,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 86/892 [08:46<1:16:08, 5.67s/it]g-point operations will not be computed-02 11:50:50,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:57,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:50,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:50:57,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:50:50,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2596, 'learning_rate': 5.1e-05, 'epoch': 0.1} + 10%|███████▊ | 87/892 [08:52<1:14:59, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:04,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:04,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 88/892 [08:57<1:13:41, 5.50s/it]g-point operations will not be computed-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:08,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:08,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:08,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:01,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 89/892 [09:02<1:12:19, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:14,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████ | 90/892 [09:07<1:10:22, 5.27s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:18,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:18,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:20,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:22,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:24,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:24,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:27,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:29,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:29,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:31,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:33,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:33,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:34,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:34,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:36,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:38,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:38,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:39,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:42,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:42,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:44,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:44,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:46,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:46,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:48,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:48,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:50,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:50,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:54,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:54,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:54,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:57,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:51:57,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:01,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:05,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:05,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.286, 'learning_rate': 5.9999999999999995e-05, 'epoch': 0.11} +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:05,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:05,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:05,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 103/892 [10:03<1:15:27, 5.74s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:15,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:15,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:10<1:20:32, 6.13s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:10<1:20:32, 6.13s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2703, 'learning_rate': 6.12e-05, 'epoch': 0.12} + 12%|█████████▏ | 104/892 [10:10<1:20:32, 6.13s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:10<1:20:32, 6.13s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:10<1:20:32, 6.13s/it]g-point operations will not be computed-02 11:51:12,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:17<1:23:57, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:17<1:23:57, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:17<1:23:57, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:24<1:26:10, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:24<1:26:10, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3078, 'learning_rate': 6.239999999999999e-05, 'epoch': 0.12} + 12%|█████████▍ | 106/892 [10:24<1:26:10, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:40,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:40,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3431, 'learning_rate': 6.299999999999999e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:40,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:40,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:40,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▌ | 108/892 [10:38<1:28:03, 6.74s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:50,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:52:50,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 109/892 [10:45<1:28:25, 6.78s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 109/892 [10:45<1:28:25, 6.78s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0367, 'learning_rate': 6.419999999999999e-05, 'epoch': 0.12} + 12%|█████████▋ | 109/892 [10:45<1:28:25, 6.78s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:00,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:00,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1673, 'learning_rate': 6.479999999999999e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:00,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:00,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:00,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [10:59<1:27:52, 6.75s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:10,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:10,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▉ | 112/892 [11:05<1:27:39, 6.74s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▉ | 112/892 [11:05<1:27:39, 6.74s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2113, 'learning_rate': 6.599999999999999e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:19,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 113/892 [11:12<1:27:09, 6.71s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 113/892 [11:12<1:27:09, 6.71s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2212, 'learning_rate': 6.659999999999999e-05, 'epoch': 0.13} + 13%|██████████ | 113/892 [11:12<1:27:09, 6.71s/it]g-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:27,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:27,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1566, 'learning_rate': 6.72e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:27,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:27,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:27,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:52:28,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▏ | 115/892 [11:25<1:26:13, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▏ | 115/892 [11:25<1:26:13, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▏ | 115/892 [11:25<1:26:13, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 116/892 [11:32<1:25:59, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 116/892 [11:32<1:25:59, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9686, 'learning_rate': 6.84e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:45,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 117/892 [11:38<1:25:29, 6.62s/it]g-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 117/892 [11:38<1:25:29, 6.62s/it]g-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2853, 'learning_rate': 6.9e-05, 'epoch': 0.13} + 13%|██████████▎ | 117/892 [11:38<1:25:29, 6.62s/it]g-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:53,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:53,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1564, 'learning_rate': 6.96e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:53,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:53,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:53:53,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:53:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▌ | 119/892 [11:51<1:24:12, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▌ | 119/892 [11:51<1:24:12, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▌ | 119/892 [11:51<1:24:12, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▌ | 119/892 [11:51<1:24:12, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 120/892 [11:58<1:23:48, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:09,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:09,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:09,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▋ | 121/892 [12:04<1:23:51, 6.53s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:16,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:16,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▊ | 122/892 [12:11<1:22:55, 6.46s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▊ | 122/892 [12:11<1:22:55, 6.46s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:22,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:22,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 123/892 [12:17<1:22:08, 6.41s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 123/892 [12:17<1:22:08, 6.41s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:28,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:28,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 124/892 [12:23<1:21:24, 6.36s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 124/892 [12:23<1:21:24, 6.36s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:35,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:35,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████ | 125/892 [12:30<1:22:19, 6.44s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████ | 125/892 [12:30<1:22:19, 6.44s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2813, 'learning_rate': 7.379999999999999e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:43,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 126/892 [12:36<1:21:35, 6.39s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 126/892 [12:36<1:21:35, 6.39s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3306, 'learning_rate': 7.439999999999999e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:49,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:42<1:20:46, 6.34s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:42<1:20:46, 6.34s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3496, 'learning_rate': 7.5e-05, 'epoch': 0.14} + 14%|███████████▏ | 127/892 [12:42<1:20:46, 6.34s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:42<1:20:46, 6.34s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:57,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:54:57,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:01,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:01,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 129/892 [12:54<1:18:33, 6.18s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 129/892 [12:54<1:18:33, 6.18s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:07,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:07,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 130/892 [13:00<1:17:27, 6.10s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 130/892 [13:00<1:17:27, 6.10s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:13,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:13,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 131/892 [13:06<1:16:49, 6.06s/it]g-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:17,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:17,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:17,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:54:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▋ | 132/892 [13:12<1:16:08, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:22,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▋ | 132/892 [13:12<1:16:08, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:22,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▋ | 132/892 [13:12<1:16:08, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:22,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▋ | 132/892 [13:12<1:16:08, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:22,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▊ | 133/892 [13:18<1:15:04, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▊ | 133/892 [13:18<1:15:04, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:32,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:32,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3009, 'learning_rate': 7.92e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:36,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:36,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▉ | 135/892 [13:29<1:12:39, 5.76s/it]g-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:40,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:43,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:43,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2765, 'learning_rate': 8.04e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:47,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 137/892 [13:40<1:10:23, 5.59s/it]g-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 137/892 [13:40<1:10:23, 5.59s/it]g-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5165, 'learning_rate': 8.1e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:52,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:52,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:28,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 138/892 [13:45<1:08:48, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 138/892 [13:45<1:08:48, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:58,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:55:58,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:01,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:03,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:03,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1739, 'learning_rate': 8.28e-05, 'epoch': 0.16} +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:07,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:07,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:55:55,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▍ | 141/892 [13:59<1:02:02, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:09,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:11,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:09,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:11,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:09,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 142/892 [14:03<58:44, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:13,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:15,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:13,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:15,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:13,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 143/892 [14:07<55:29, 4.44s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:17,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████ | 144/892 [14:11<52:15, 4.19s/it]g-point operations will not be computed-02 11:56:17,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████ | 144/892 [14:11<52:15, 4.19s/it]g-point operations will not be computed-02 11:56:17,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████ | 144/892 [14:11<52:15, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:20,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▏ | 145/892 [14:14<49:10, 3.95s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:23,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▏ | 145/892 [14:14<49:10, 3.95s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:23,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:25,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:23,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:25,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:23,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▎ | 146/892 [14:17<45:50, 3.69s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:26,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▎ | 147/892 [14:20<42:29, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▎ | 147/892 [14:20<42:29, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 148/892 [14:23<39:12, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:32,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 148/892 [14:23<39:12, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:32,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 149/892 [14:25<36:12, 2.92s/it]g-point operations will not be computed-02 11:56:32,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 149/892 [14:25<36:12, 2.92s/it]g-point operations will not be computed-02 11:56:32,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:35,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:34,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 150/892 [14:28<34:42, 2.81s/it]g-point operations will not be computed-02 11:56:34,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 150/892 [14:28<34:42, 2.81s/it]g-point operations will not be computed-02 11:56:34,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 150/892 [14:28<34:42, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:38,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 150/892 [14:28<34:42, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:38,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:42,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:38,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:42,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:38,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 151/892 [14:35<52:22, 4.24s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:45,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 151/892 [14:35<52:22, 4.24s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:45,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:49,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:45,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 152/892 [14:42<1:03:07, 5.12s/it]g-point operations will not be computed-02 11:56:45,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 152/892 [14:42<1:03:07, 5.12s/it]g-point operations will not be computed-02 11:56:45,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 152/892 [14:42<1:03:07, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 152/892 [14:42<1:03:07, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:58,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:58,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4506, 'learning_rate': 9.059999999999999e-05, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:58,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:56:58,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [14:57<1:15:20, 6.12s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [14:57<1:15:20, 6.12s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1731, 'learning_rate': 9.12e-05, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:10,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [15:03<1:18:07, 6.36s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [15:03<1:18:07, 6.36s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1782, 'learning_rate': 9.18e-05, 'epoch': 0.17} + 17%|█████████████▋ | 155/892 [15:03<1:18:07, 6.36s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [15:03<1:18:07, 6.36s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [15:03<1:18:07, 6.36s/it]g-point operations will not be computed-02 11:56:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [15:10<1:19:54, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [15:10<1:19:54, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [15:10<1:19:54, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 157/892 [15:17<1:21:02, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 157/892 [15:17<1:21:02, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4489, 'learning_rate': 9.3e-05, 'epoch': 0.18} + 18%|█████████████▉ | 157/892 [15:17<1:21:02, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:32,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:32,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.51, 'learning_rate': 9.36e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:32,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:32,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████ | 159/892 [15:31<1:21:54, 6.70s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████ | 159/892 [15:31<1:21:54, 6.70s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:43,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:43,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▏ | 160/892 [15:38<1:22:14, 6.74s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▏ | 160/892 [15:38<1:22:14, 6.74s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3013, 'learning_rate': 9.479999999999999e-05, 'epoch': 0.18} + 18%|██████████████▏ | 160/892 [15:38<1:22:14, 6.74s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:53,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:53,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3347, 'learning_rate': 9.539999999999999e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:53,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2858, 'learning_rate': 9.599999999999999e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:57:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▍ | 163/892 [15:58<1:21:14, 6.69s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:09,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:09,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:09,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 164/892 [16:04<1:20:57, 6.67s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 164/892 [16:04<1:20:57, 6.67s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:17,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:17,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 165/892 [16:11<1:20:19, 6.63s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 165/892 [16:11<1:20:19, 6.63s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:24,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:24,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [16:17<1:19:38, 6.58s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [16:17<1:19:38, 6.58s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [16:17<1:19:38, 6.58s/it]g-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:32,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:32,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.306, 'learning_rate': 9.9e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:32,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1518, 'learning_rate': 9.96e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:58:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:57:20,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:36<1:17:58, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:47,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:36<1:17:58, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:47,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:36<1:17:58, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:47,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:36<1:17:58, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:47,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [16:43<1:17:38, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [16:43<1:17:38, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [16:43<1:17:38, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [16:43<1:17:38, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 171/892 [16:49<1:16:58, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:01,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:01,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 172/892 [16:56<1:16:45, 6.40s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 172/892 [16:56<1:16:45, 6.40s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:07,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:07,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 173/892 [17:02<1:16:13, 6.36s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 173/892 [17:02<1:16:13, 6.36s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3668, 'learning_rate': 0.0001026, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:15,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 174/892 [17:08<1:15:50, 6.34s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 174/892 [17:08<1:15:50, 6.34s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1735, 'learning_rate': 0.00010319999999999999, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:21,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3279, 'learning_rate': 0.00010379999999999999, 'epoch': 0.2} + g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:29,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:29,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2638, 'learning_rate': 0.00010439999999999999, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:29,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:35,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:35,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2474, 'learning_rate': 0.00010499999999999999, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:40,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▊ | 178/892 [17:33<1:13:32, 6.18s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▊ | 178/892 [17:33<1:13:32, 6.18s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2505, 'learning_rate': 0.00010559999999999998, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:46,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▊ | 179/892 [17:39<1:12:35, 6.11s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▊ | 179/892 [17:39<1:12:35, 6.11s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:50,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:50,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▉ | 180/892 [17:45<1:11:47, 6.05s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▉ | 180/892 [17:45<1:11:47, 6.05s/it]g-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:56,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 11:59:56,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 11:58:53,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 181/892 [17:51<1:10:45, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 181/892 [17:51<1:10:45, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3573, 'learning_rate': 0.00010739999999999998, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:05,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:05,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3769, 'learning_rate': 0.00010799999999999998, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:05,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3471, 'learning_rate': 0.00010859999999999998, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:16,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:16,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7017, 'learning_rate': 0.00010919999999999998, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:20,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:00,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▍ | 185/892 [18:13<1:06:52, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▍ | 185/892 [18:13<1:06:52, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3939, 'learning_rate': 0.00010979999999999999, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:27,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:27,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2426, 'learning_rate': 0.00011039999999999999, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:31,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:31,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▌ | 187/892 [18:24<1:04:22, 5.48s/it]g-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:35,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:35,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:37,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:37,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:41,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▋ | 189/892 [18:34<1:01:46, 5.27s/it]g-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▋ | 189/892 [18:34<1:01:46, 5.27s/it]g-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:45,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:47,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:47,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:50,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:50,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:23,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▎ | 191/892 [18:43<58:41, 5.02s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:53,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▎ | 191/892 [18:43<58:41, 5.02s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:53,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:55,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:53,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▍ | 192/892 [18:48<56:29, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:57,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▍ | 192/892 [18:48<56:29, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:00:57,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:00:59,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:00:57,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 193/892 [18:52<54:02, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:01,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 193/892 [18:52<54:02, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:01,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:03,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:01,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 194/892 [18:56<50:59, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:05,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 194/892 [18:56<50:59, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:05,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▋ | 195/892 [18:59<47:47, 4.11s/it]g-point operations will not be computed-02 12:01:05,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▋ | 195/892 [18:59<47:47, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:09,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▋ | 195/892 [18:59<47:47, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:09,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▊ | 196/892 [19:02<44:16, 3.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▊ | 196/892 [19:02<44:16, 3.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▉ | 197/892 [19:05<40:38, 3.51s/it]g-point operations will not be computed-02 12:01:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▉ | 197/892 [19:05<40:38, 3.51s/it]g-point operations will not be computed-02 12:01:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:16,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:16,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:18,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:17,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:20,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:19,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:20,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:19,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0053, 'learning_rate': 0.0001182, 'epoch': 0.22} + 22%|██████████████████▏ | 200/892 [19:13<32:28, 2.82s/it]g-point operations will not be computed-02 12:01:19,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▏ | 200/892 [19:13<32:28, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:23,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▏ | 200/892 [19:13<32:28, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:23,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:27,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:23,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [19:20<48:20, 4.20s/it]g-point operations will not be computed-02 12:01:23,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [19:20<48:20, 4.20s/it]g-point operations will not be computed-02 12:01:23,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [19:20<48:20, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:30,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:34,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:30,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:27<58:42, 5.10s/it]g-point operations will not be computed-02 12:01:30,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:27<58:42, 5.10s/it]g-point operations will not be computed-02 12:01:30,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|��█████████████████▎ | 202/892 [19:27<58:42, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:27<58:42, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:27<58:42, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:34<1:05:45, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:34<1:05:45, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:46,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:46,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:01:46,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [19:41<1:10:02, 6.11s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [19:41<1:10:02, 6.11s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [19:41<1:10:02, 6.11s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [19:41<1:10:02, 6.11s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [19:48<1:12:44, 6.35s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [19:48<1:12:44, 6.35s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:00,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:00,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [19:55<1:14:29, 6.52s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [19:55<1:14:29, 6.52s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2588, 'learning_rate': 0.0001224, 'epoch': 0.23} + 23%|██████████████████▏ | 206/892 [19:55<1:14:29, 6.52s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2876, 'learning_rate': 0.00012299999999999998, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [20:09<1:16:06, 6.68s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [20:09<1:16:06, 6.68s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:21,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:21,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:21,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▌ | 209/892 [20:16<1:16:23, 6.71s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▌ | 209/892 [20:16<1:16:23, 6.71s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:29,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:29,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [20:22<1:16:24, 6.72s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [20:22<1:16:24, 6.72s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [20:22<1:16:24, 6.72s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:37,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:37,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3784, 'learning_rate': 0.00012539999999999999, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:37,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:37,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:37,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▊ | 212/892 [20:36<1:15:39, 6.68s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:47,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:47,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:47,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▊ | 213/892 [20:42<1:15:16, 6.65s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▊ | 213/892 [20:42<1:15:16, 6.65s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:56,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:02:56,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:49<1:15:00, 6.64s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:49<1:15:00, 6.64s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:49<1:15:00, 6.64s/it]g-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:04,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:04,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2635, 'learning_rate': 0.0001278, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:04,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:10,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:10,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3944, 'learning_rate': 0.00012839999999999998, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:10,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:10,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:10,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:01:37,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 217/892 [21:08<1:13:27, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 217/892 [21:08<1:13:27, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 217/892 [21:08<1:13:27, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 217/892 [21:08<1:13:27, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [21:15<1:13:06, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:26,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:26,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:26,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 219/892 [21:21<1:12:28, 6.46s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 219/892 [21:21<1:12:28, 6.46s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:34,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 220/892 [21:28<1:12:16, 6.45s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 220/892 [21:28<1:12:16, 6.45s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3954, 'learning_rate': 0.00013079999999999998, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:41,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [21:34<1:12:07, 6.45s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [21:34<1:12:07, 6.45s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2565, 'learning_rate': 0.0001314, 'epoch': 0.25} + 25%|███████████████████▌ | 221/892 [21:34<1:12:07, 6.45s/it]g-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:49,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:49,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3935, 'learning_rate': 0.00013199999999999998, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:49,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4942, 'learning_rate': 0.0001326, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-02 12:03:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3912, 'learning_rate': 0.00013319999999999999, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:03:18,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [22:00<1:11:40, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [22:00<1:11:40, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [22:00<1:11:40, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [22:00<1:11:40, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████ | 226/892 [22:06<1:10:53, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████ | 227/892 [22:12<1:10:01, 6.32s/it]g-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:23,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:23,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:23,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:10,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▏ | 228/892 [22:18<1:09:17, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▏ | 228/892 [22:18<1:09:17, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:32,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:32,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3784, 'learning_rate': 0.0001362, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:32,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:38,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:38,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4013, 'learning_rate': 0.0001368, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:38,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:44,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:44,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7712, 'learning_rate': 0.0001374, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:44,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:50,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:50,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5995, 'learning_rate': 0.000138, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:54,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 233/892 [22:47<1:04:32, 5.88s/it]g-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 233/892 [22:47<1:04:32, 5.88s/it]g-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:59,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:04:59,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:04:28,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 234/892 [22:53<1:03:21, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 234/892 [22:53<1:03:21, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6203, 'learning_rate': 0.0001392, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:07,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:07,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5716, 'learning_rate': 0.00013979999999999998, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:11,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▉ | 236/892 [23:04<1:01:19, 5.61s/it]g-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▉ | 236/892 [23:04<1:01:19, 5.61s/it]g-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:15,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:15,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:03,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|████████████████████▉ | 237/892 [23:09<1:00:05, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|████████████████████▉ | 237/892 [23:09<1:00:05, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2867, 'learning_rate': 0.00014099999999999998, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:23,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:23,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:25,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:25,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:25,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:19,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▋ | 239/892 [23:19<57:35, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▋ | 239/892 [23:19<57:35, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▋ | 239/892 [23:19<57:35, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:33,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:35,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:35,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:37,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:39,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:39,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:41,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:44,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:44,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:45,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:47,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:47,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:49,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:51,443 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:51,443 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:53,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:56,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:56,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:57,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:57,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:59,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:05:59,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:01,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:01,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:03,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:06,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:06,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3328, 'learning_rate': 0.00014879999999999998, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:10,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:10,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:10,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:13,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:13,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:17,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:17,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:17,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:20,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:20,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:19<1:00:40, 5.70s/it]g-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:19<1:00:40, 5.70s/it]g-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:19<1:00:40, 5.70s/it]g-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:19<1:00:40, 5.70s/it]g-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:19<1:00:40, 5.70s/it]g-point operations will not be computed-02 12:05:29,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:26<1:04:43, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:26<1:04:43, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:26<1:04:43, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:26<1:04:43, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▌ | 255/892 [24:33<1:07:47, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▌ | 255/892 [24:33<1:07:47, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|████████████████��█████▌ | 255/892 [24:33<1:07:47, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:49,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:49,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5144, 'learning_rate': 0.0001524, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:49,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:49,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:49,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 257/892 [24:47<1:10:43, 6.68s/it]g-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:59,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:06:59,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [24:54<1:11:09, 6.73s/it]g-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [24:54<1:11:09, 6.73s/it]g-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3156, 'learning_rate': 0.0001536, 'epoch': 0.29} + 29%|██████████████████████▊ | 258/892 [24:54<1:11:09, 6.73s/it]g-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [24:54<1:11:09, 6.73s/it]g-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [24:54<1:11:09, 6.73s/it]g-point operations will not be computed-02 12:06:36,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:01<1:11:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:01<1:11:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:01<1:11:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:01<1:11:07, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 260/892 [25:08<1:11:05, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:19,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:19,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:19,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 261/892 [25:14<1:10:56, 6.75s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 261/892 [25:14<1:10:56, 6.75s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 261/892 [25:14<1:10:56, 6.75s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:29,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:29,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5021, 'learning_rate': 0.000156, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:29,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:36,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:36,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4703, 'learning_rate': 0.00015659999999999998, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:36,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:36,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:36,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████�� | 264/892 [25:34<1:10:01, 6.69s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:46,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:46,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 265/892 [25:41<1:09:53, 6.69s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 265/892 [25:41<1:09:53, 6.69s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5204, 'learning_rate': 0.0001578, 'epoch': 0.3} + 30%|███████████████████████▍ | 265/892 [25:41<1:09:53, 6.69s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:56,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:56,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8227, 'learning_rate': 0.0001584, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-02 12:07:56,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:03,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:03,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4607, 'learning_rate': 0.000159, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:03,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:03,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:03,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 268/892 [26:01<1:08:44, 6.61s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:12,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:12,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▊ | 269/892 [26:07<1:08:12, 6.57s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▊ | 269/892 [26:07<1:08:12, 6.57s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:19,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:19,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▉ | 270/892 [26:14<1:07:51, 6.55s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▉ | 270/892 [26:14<1:07:51, 6.55s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.584, 'learning_rate': 0.0001608, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:27,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 271/892 [26:20<1:07:37, 6.53s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 271/892 [26:20<1:07:37, 6.53s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2784, 'learning_rate': 0.0001614, 'epoch': 0.3} + 30%|████████████████████████ | 271/892 [26:20<1:07:37, 6.53s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:35,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:35,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4427, 'learning_rate': 0.000162, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:35,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7132, 'learning_rate': 0.0001626, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:48,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:48,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:48,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3542, 'learning_rate': 0.0001632, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:48,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▎ | 275/892 [26:46<1:07:03, 6.52s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▎ | 275/892 [26:46<1:07:03, 6.52s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8528, 'learning_rate': 0.0001638, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:08:59,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▍ | 276/892 [26:52<1:06:14, 6.45s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▍ | 276/892 [26:52<1:06:14, 6.45s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.848, 'learning_rate': 0.0001644, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:05,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 277/892 [26:59<1:05:24, 6.38s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 277/892 [26:59<1:05:24, 6.38s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6258, 'learning_rate': 0.000165, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:12,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [27:05<1:04:40, 6.32s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [27:05<1:04:40, 6.32s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2584, 'learning_rate': 0.0001656, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:18,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [27:11<1:03:47, 6.24s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [27:11<1:03:47, 6.24s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4303, 'learning_rate': 0.0001662, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:24,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▊ | 280/892 [27:17<1:02:59, 6.18s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▊ | 280/892 [27:17<1:02:59, 6.18s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:28,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:28,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 281/892 [27:23<1:02:17, 6.12s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 281/892 [27:23<1:02:17, 6.12s/it]g-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:34,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:34,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:07:11,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 282/892 [27:29<1:01:37, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:09:39,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 282/892 [27:29<1:01:37, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:09:39,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4254, 'learning_rate': 0.000168, 'epoch': 0.32} + 32%|████████████████████████▉ | 282/892 [27:29<1:01:37, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:09:39,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 282/892 [27:29<1:01:37, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:09:39,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████ | 283/892 [27:34<1:00:27, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████ | 283/892 [27:34<1:00:27, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:48,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:48,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5322, 'learning_rate': 0.00016919999999999997, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:52,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 285/892 [27:45<57:46, 5.71s/it]g-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 285/892 [27:45<57:46, 5.71s/it]g-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:57,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:59,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:09:59,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4425, 'learning_rate': 0.00017039999999999997, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:03,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████ | 287/892 [27:56<55:25, 5.50s/it]g-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████ | 287/892 [27:56<55:25, 5.50s/it]g-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:07,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:07,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:07,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:09:44,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 288/892 [28:01<54:20, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:13,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 289/892 [28:06<52:59, 5.27s/it]g-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 289/892 [28:06<52:59, 5.27s/it]g-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:17,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:22,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6296, 'learning_rate': 0.00017339999999999996, 'epoch': 0.33} +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:27,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:27,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 292/892 [28:20<47:24, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:29,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:31,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:29,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:31,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:29,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 293/892 [28:24<45:08, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:33,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 294/892 [28:28<42:42, 4.28s/it]g-point operations will not be computed-02 12:10:33,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 294/892 [28:28<42:42, 4.28s/it]g-point operations will not be computed-02 12:10:33,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 294/892 [28:28<42:42, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:37,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 294/892 [28:28<42:42, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:37,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▊ | 295/892 [28:31<40:16, 4.05s/it]g-point operations will not be computed-02 12:10:37,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:42,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:40,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:42,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:40,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 296/892 [28:34<37:19, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:43,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 296/892 [28:34<37:19, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:43,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 297/892 [28:37<34:17, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:46,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 297/892 [28:37<34:17, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:46,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|███████████████████████████ | 298/892 [28:39<31:34, 3.19s/it]g-point operations will not be computed-02 12:10:46,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|███████████████████████████ | 298/892 [28:39<31:34, 3.19s/it]g-point operations will not be computed-02 12:10:46,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 299/892 [28:42<28:35, 2.89s/it]g-point operations will not be computed-02 12:10:48,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:52,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:51,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:52,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:51,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 300/892 [28:44<27:35, 2.80s/it]g-point operations will not be computed-02 12:10:51,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 300/892 [28:44<27:35, 2.80s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:10:55,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:55,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:10:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:10:55,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:52<41:34, 4.22s/it]g-point operations will not be computed-02 12:10:55,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:52<41:34, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:11:02,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:52<41:34, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:11:02,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:06,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:02,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:06,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:02,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 302/892 [28:59<50:13, 5.11s/it]g-point operations will not be computed-02 12:11:02,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 302/892 [28:59<50:13, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:13,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:06<56:28, 5.75s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:06<56:28, 5.75s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4828, 'learning_rate': 0.00018059999999999997, 'epoch': 0.34} + 34%|███████████████████████████▌ | 303/892 [29:06<56:28, 5.75s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:06<56:28, 5.75s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:06<56:28, 5.75s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|██████████████████████████▉ | 304/892 [29:13<1:01:02, 6.23s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|██████████████████████████▉ | 304/892 [29:13<1:01:02, 6.23s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|██████████████████████████▉ | 304/892 [29:13<1:01:02, 6.23s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:29,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:29,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4415, 'learning_rate': 0.00018179999999999997, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:29,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:29,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:29,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [29:28<1:06:36, 6.82s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [29:28<1:06:36, 6.82s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [29:28<1:06:36, 6.82s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [29:28<1:06:36, 6.82s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [29:28<1:06:36, 6.82s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [29:36<1:08:08, 6.99s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [29:36<1:08:08, 6.99s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:11:49,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 308/892 [29:43<1:08:52, 7.08s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 308/892 [29:43<1:08:52, 7.08s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1051, 'learning_rate': 0.0001836, 'epoch': 0.35} + 35%|███████████████████████████▎ | 308/892 [29:43<1:08:52, 7.08s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 308/892 [29:43<1:08:52, 7.08s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 308/892 [29:43<1:08:52, 7.08s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:50<1:09:02, 7.11s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:50<1:09:02, 7.11s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:50<1:09:02, 7.11s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:50<1:09:02, 7.11s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:50<1:09:02, 7.11s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [29:58<1:10:07, 7.23s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:10,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:10,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:10,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▌ | 311/892 [30:05<1:09:47, 7.21s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▌ | 311/892 [30:05<1:09:47, 7.21s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▌ | 311/892 [30:05<1:09:47, 7.21s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:20,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:20,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6674, 'learning_rate': 0.000186, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:20,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:29,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:29,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5483, 'learning_rate': 0.00018659999999999998, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:29,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:29,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▊ | 314/892 [30:27<1:11:04, 7.38s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▊ | 314/892 [30:27<1:11:04, 7.38s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6706, 'learning_rate': 0.0001872, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-02 12:12:41,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [30:34<1:10:00, 7.28s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [30:34<1:10:00, 7.28s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4163, 'learning_rate': 0.00018779999999999998, 'epoch': 0.35} + 35%|███████████████████████████▉ | 315/892 [30:34<1:10:00, 7.28s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [30:34<1:10:00, 7.28s/it]g-point operations will not be computed-02 12:11:09,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 316/892 [30:41<1:08:56, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|█████���█████████████████████▉ | 316/892 [30:41<1:08:56, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7195, 'learning_rate': 0.00018839999999999997, 'epoch': 0.35} + 35%|███████████████████████████▉ | 316/892 [30:41<1:08:56, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████ | 317/892 [30:48<1:07:57, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████ | 317/892 [30:48<1:07:57, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3358, 'learning_rate': 0.00018899999999999999, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:02,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▏ | 318/892 [30:55<1:06:52, 6.99s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▏ | 318/892 [30:55<1:06:52, 6.99s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6431, 'learning_rate': 0.00018959999999999997, 'epoch': 0.36} + 36%|████████████████████████████▏ | 318/892 [30:55<1:06:52, 6.99s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▏ | 318/892 [30:55<1:06:52, 6.99s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▎ | 319/892 [31:02<1:06:05, 6.92s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▎ | 319/892 [31:02<1:06:05, 6.92s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:13,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:13,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▎ | 320/892 [31:08<1:05:18, 6.85s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▎ | 320/892 [31:08<1:05:18, 6.85s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5086, 'learning_rate': 0.00019079999999999998, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:22,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▍ | 321/892 [31:15<1:04:57, 6.83s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▍ | 321/892 [31:15<1:04:57, 6.83s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9276, 'learning_rate': 0.0001914, 'epoch': 0.36} + 36%|████████████████████████████▍ | 321/892 [31:15<1:04:57, 6.83s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▍ | 321/892 [31:15<1:04:57, 6.83s/it]g-point operations will not be computed-02 12:12:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 322/892 [31:22<1:04:45, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 322/892 [31:22<1:04:45, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3389, 'learning_rate': 0.00019199999999999998, 'epoch': 0.36} + 36%|████████████████████████████▌ | 322/892 [31:22<1:04:45, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 323/892 [31:29<1:04:44, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 323/892 [31:29<1:04:44, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:41,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:41,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▋ | 324/892 [31:35<1:04:07, 6.77s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▋ | 324/892 [31:35<1:04:07, 6.77s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7336, 'learning_rate': 0.00019319999999999998, 'epoch': 0.36} + 36%|████████████████████████████▋ | 324/892 [31:35<1:04:07, 6.77s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▋ | 324/892 [31:35<1:04:07, 6.77s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▊ | 325/892 [31:43<1:05:23, 6.92s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▊ | 325/892 [31:43<1:05:23, 6.92s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:54,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:13:54,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▊ | 326/892 [31:49<1:04:17, 6.81s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▊ | 326/892 [31:49<1:04:17, 6.81s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:01,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:01,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:01,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▉ | 327/892 [31:56<1:03:01, 6.69s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▉ | 327/892 [31:56<1:03:01, 6.69s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▉ | 327/892 [31:56<1:03:01, 6.69s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▉ | 327/892 [31:56<1:03:01, 6.69s/it]g-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:10,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:10,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:10,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:17,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:17,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0732, 'learning_rate': 0.0001962, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:17,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:17,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:13:32,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1987, 'learning_rate': 0.00019679999999999999, 'epoch': 0.37} + 37%|█████████████████████████████▏ | 330/892 [32:15<1:00:23, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▏ | 330/892 [32:15<1:00:23, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:29,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:29,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4289, 'learning_rate': 0.0001974, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:29,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:29,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:29,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 332/892 [32:27<58:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:37,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 332/892 [32:27<58:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:37,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 332/892 [32:27<58:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:37,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 332/892 [32:27<58:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:37,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 333/892 [32:33<58:53, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 333/892 [32:33<58:53, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:48,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:48,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.697, 'learning_rate': 0.0001992, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:48,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:54,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:54,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7254, 'learning_rate': 0.0001998, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:54,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:59,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:14:59,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4706, 'learning_rate': 0.0002004, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:04,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:04,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 337/892 [32:57<54:37, 5.91s/it]g-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:08,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:08,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:08,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:14:43,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▋ | 338/892 [33:02<53:09, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:12,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▋ | 338/892 [33:02<53:09, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:12,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:16,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:12,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:16,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:12,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5032, 'learning_rate': 0.0002022, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:20,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:12,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:20,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:12,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▊ | 340/892 [33:12<50:24, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▊ | 340/892 [33:12<50:24, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:26,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:26,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:28,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:31,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:31,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5937, 'learning_rate': 0.000204, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:34,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:34,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|███████████████████████████████▏ | 343/892 [33:26<44:34, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:36,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:38,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:36,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:38,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:36,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▏ | 344/892 [33:30<42:01, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:40,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▎ | 345/892 [33:34<38:56, 4.27s/it]g-point operations will not be computed-02 12:15:40,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▎ | 345/892 [33:34<38:56, 4.27s/it]g-point operations will not be computed-02 12:15:40,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:45,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:43,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:45,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:43,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▍ | 346/892 [33:37<35:53, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:46,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 347/892 [33:40<32:52, 3.62s/it]g-point operations will not be computed-02 12:15:46,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 347/892 [33:40<32:52, 3.62s/it]g-point operations will not be computed-02 12:15:46,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:50,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:49,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:50,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:49,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:52,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:52,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:55,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:54,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:15:55,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:54,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 350/892 [33:47<25:54, 2.87s/it]g-point operations will not be computed-02 12:15:54,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 350/892 [33:47<25:54, 2.87s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:58,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 350/892 [33:47<25:54, 2.87s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:15:58,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:01,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:58,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:01,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:15:58,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 351/892 [33:55<38:32, 4.27s/it]g-point operations will not be computed-02 12:15:58,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 351/892 [33:55<38:32, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:05,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:09,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:05,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [34:02<46:25, 5.16s/it]g-point operations will not be computed-02 12:16:05,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [34:02<46:25, 5.16s/it]g-point operations will not be computed-02 12:16:05,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [34:02<46:25, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [34:02<46:25, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [34:02<46:25, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [34:02<46:25, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 353/892 [34:09<51:49, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:21,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:21,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [34:16<55:14, 6.16s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████��███████████████████████████▏ | 354/892 [34:16<55:14, 6.16s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9139, 'learning_rate': 0.00021119999999999996, 'epoch': 0.4} + 40%|████████████████████████████████▏ | 354/892 [34:16<55:14, 6.16s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [34:16<55:14, 6.16s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [34:16<55:14, 6.16s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 355/892 [34:23<57:31, 6.43s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:35,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:35,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [34:30<59:07, 6.62s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [34:30<59:07, 6.62s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1954, 'learning_rate': 0.00021239999999999996, 'epoch': 0.4} + 40%|████████████████████████████████▎ | 356/892 [34:30<59:07, 6.62s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [34:30<59:07, 6.62s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [34:30<59:07, 6.62s/it]g-point operations will not be computed-02 12:16:12,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▌ | 357/892 [34:37<1:00:00, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▌ | 357/892 [34:37<1:00:00, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▌ | 357/892 [34:37<1:00:00, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▋ | 358/892 [34:44<1:00:29, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▋ | 358/892 [34:44<1:00:29, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0957, 'learning_rate': 0.00021359999999999996, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-02 12:16:58,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▊ | 359/892 [34:51<1:00:33, 6.82s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▊ | 359/892 [34:51<1:00:33, 6.82s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6529, 'learning_rate': 0.00021419999999999998, 'epoch': 0.4} + 40%|███████████████████████████████▊ | 359/892 [34:51<1:00:33, 6.82s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:06,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:06,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7965, 'learning_rate': 0.00021479999999999996, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:06,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:06,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▉ | 361/892 [35:05<1:00:15, 6.81s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▉ | 361/892 [35:05<1:00:15, 6.81s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8971, 'learning_rate': 0.00021539999999999998, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:18,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████ | 362/892 [35:12<1:00:00, 6.79s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████ | 362/892 [35:12<1:00:00, 6.79s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5586, 'learning_rate': 0.00021599999999999996, 'epoch': 0.41} + 41%|████████████████████████████████ | 362/892 [35:12<1:00:00, 6.79s/it]g-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:27,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:27,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4938, 'learning_rate': 0.00021659999999999998, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:27,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:27,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:16:48,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 364/892 [35:25<59:15, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 364/892 [35:25<59:15, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.777, 'learning_rate': 0.00021719999999999997, 'epoch': 0.41} + 41%|█████████████████████████████████ | 364/892 [35:25<59:15, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 365/892 [35:32<58:50, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 365/892 [35:32<58:50, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4398, 'learning_rate': 0.00021779999999999998, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:45,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 366/892 [35:38<58:29, 6.67s/it]g-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 366/892 [35:38<58:29, 6.67s/it]g-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9263, 'learning_rate': 0.00021839999999999997, 'epoch': 0.41} + 41%|█████████████████████████████████▏ | 366/892 [35:38<58:29, 6.67s/it]g-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:53,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:53,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6826, 'learning_rate': 0.00021899999999999998, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-02 12:17:53,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:00,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:00,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:00,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5316, 'learning_rate': 0.00021959999999999997, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:00,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:17:35,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [35:58<57:10, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [35:58<57:10, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7346, 'learning_rate': 0.00022019999999999999, 'epoch': 0.41} + 41%|█████████████████████████████████▌ | 369/892 [35:58<57:10, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [35:58<57:10, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 370/892 [36:04<56:47, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 370/892 [36:04<56:47, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:17,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:17,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▋ | 371/892 [36:11<56:22, 6.49s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▋ | 371/892 [36:11<56:22, 6.49s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:24,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:24,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 372/892 [36:17<56:18, 6.50s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 372/892 [36:17<56:18, 6.50s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:30,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 373/892 [36:24<55:57, 6.47s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 373/892 [36:24<55:57, 6.47s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7205, 'learning_rate': 0.0002226, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:37,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▉ | 374/892 [36:30<55:03, 6.38s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▉ | 374/892 [36:30<55:03, 6.38s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9808, 'learning_rate': 0.00022319999999999998, 'epoch': 0.42} + 42%|█████████████████████████████████▉ | 374/892 [36:30<55:03, 6.38s/it]g-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:45,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:45,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4609, 'learning_rate': 0.0002238, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:45,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:45,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:18:45,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:18:08,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [36:43<54:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:53,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [36:43<54:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:53,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [36:43<54:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:53,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [36:43<54:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:53,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 377/892 [36:49<54:00, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:59,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 377/892 [36:49<54:00, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:59,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 377/892 [36:49<54:00, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:59,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 377/892 [36:49<54:00, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:18:59,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 378/892 [36:55<53:21, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 378/892 [36:55<53:21, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:09,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:09,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5312, 'learning_rate': 0.00022619999999999997, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:09,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:15,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:15,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7006, 'learning_rate': 0.00022679999999999998, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:19,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 381/892 [37:13<51:24, 6.04s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 381/892 [37:13<51:24, 6.04s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5056, 'learning_rate': 0.00022739999999999997, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:25,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:25,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▋ | 382/892 [37:18<50:53, 5.99s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:30,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:30,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:30,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▊ | 383/892 [37:24<50:05, 5.91s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:35,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:38,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:38,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6337, 'learning_rate': 0.0002292, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:42,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▉ | 385/892 [37:35<48:20, 5.72s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▉ | 385/892 [37:35<48:20, 5.72s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6499, 'learning_rate': 0.00022979999999999997, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:48,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:48,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████ | 386/892 [37:41<47:24, 5.62s/it]g-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:52,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:52,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:52,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:05,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████▏ | 387/892 [37:46<46:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:19:58,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████▏ | 388/892 [37:51<45:32, 5.42s/it]g-point operations will not be computed-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████▏ | 388/892 [37:51<45:32, 5.42s/it]g-point operations will not be computed-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:02,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:02,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:02,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:19:56,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▎ | 389/892 [37:56<44:31, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:08,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▍ | 390/892 [38:01<43:19, 5.18s/it]g-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▍ | 390/892 [38:01<43:19, 5.18s/it]g-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:12,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:14,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:14,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:16,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:19,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:19,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:21,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:23,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:23,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:27,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:27,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:29,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:30,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:30,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:32,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:32,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:34,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:37,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:37,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:39,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:39,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:40,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:40,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:42,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:44,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:44,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.215, 'learning_rate': 0.0002388, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:51,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:55,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:55,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:58,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:58,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.897, 'learning_rate': 0.00023999999999999998, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:58,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:58,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:20:58,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:20:06,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 403/892 [38:57<46:34, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 403/892 [38:57<46:34, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 403/892 [38:57<46:34, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▋ | 404/892 [39:04<49:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▋ | 404/892 [39:04<49:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7273, 'learning_rate': 0.00024119999999999998, 'epoch': 0.45} + 45%|████████████████████████████████████▋ | 404/892 [39:04<49:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:20,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:20,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8053, 'learning_rate': 0.0002418, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:20,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:20,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▊ | 406/892 [39:18<53:02, 6.55s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▊ | 406/892 [39:18<53:02, 6.55s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9928, 'learning_rate': 0.00024239999999999998, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:32,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [39:25<53:49, 6.66s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [39:25<53:49, 6.66s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5314, 'learning_rate': 0.000243, 'epoch': 0.46} + 46%|████████████████████████████████████▉ | 407/892 [39:25<53:49, 6.66s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [39:25<53:49, 6.66s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [39:25<53:49, 6.66s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████ | 408/892 [39:32<54:33, 6.76s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:44,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:44,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 409/892 [39:39<54:42, 6.80s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 409/892 [39:39<54:42, 6.80s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6468, 'learning_rate': 0.00024419999999999997, 'epoch': 0.46} + 46%|█████████████████████████████████████▏ | 409/892 [39:39<54:42, 6.80s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:54,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:54,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8918, 'learning_rate': 0.0002448, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:54,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:54,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:21:54,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▎ | 411/892 [39:53<54:23, 6.79s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:04,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:04,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 412/892 [39:59<54:02, 6.75s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 412/892 [39:59<54:02, 6.75s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8, 'learning_rate': 0.00024599999999999996, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:13,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:06<53:49, 6.74s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:06<53:49, 6.74s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.212, 'learning_rate': 0.0002466, 'epoch': 0.46} + 46%|█████████████████████████████████████▌ | 413/892 [40:06<53:49, 6.74s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:06<53:49, 6.74s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:06<53:49, 6.74s/it]g-point operations will not be computed-02 12:21:07,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 414/892 [40:13<53:40, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 414/892 [40:13<53:40, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|███████��█████████████████████████████▌ | 414/892 [40:13<53:40, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▋ | 415/892 [40:19<53:19, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▋ | 415/892 [40:19<53:19, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:31,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:31,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [40:26<53:00, 6.68s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [40:26<53:00, 6.68s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6498, 'learning_rate': 0.00024839999999999997, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:39,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 417/892 [40:33<52:41, 6.66s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 417/892 [40:33<52:41, 6.66s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7483, 'learning_rate': 0.000249, 'epoch': 0.47} + 47%|█████████████████████████████████████▊ | 417/892 [40:33<52:41, 6.66s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:48,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:48,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7704, 'learning_rate': 0.00024959999999999994, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:48,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:48,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████��� | 419/892 [40:46<52:11, 6.62s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████ | 419/892 [40:46<52:11, 6.62s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:57,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:22:57,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 420/892 [40:52<51:47, 6.58s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 420/892 [40:52<51:47, 6.58s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6681, 'learning_rate': 0.00025079999999999997, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:05,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [40:59<51:16, 6.53s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [40:59<51:16, 6.53s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4978, 'learning_rate': 0.0002514, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:12,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▎ | 422/892 [41:05<50:52, 6.49s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▎ | 422/892 [41:05<50:52, 6.49s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0288, 'learning_rate': 0.00025199999999999995, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:18,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [41:11<50:24, 6.45s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [41:11<50:24, 6.45s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9343, 'learning_rate': 0.00025259999999999996, 'epoch': 0.47} + 47%|██████████████████████████████████████▍ | 423/892 [41:11<50:24, 6.45s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [41:11<50:24, 6.45s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:26,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:26,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:26,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:26,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:26,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 425/892 [41:25<51:00, 6.55s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:36,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:36,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:36,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▋ | 426/892 [41:31<50:14, 6.47s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:42,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:42,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:42,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 427/892 [41:37<49:24, 6.37s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:49,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:49,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:49,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 428/892 [41:43<48:52, 6.32s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:55,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:55,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:23:55,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▉ | 429/892 [41:49<48:18, 6.26s/it]g-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:01,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:01,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:01,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:22:23,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [41:55<47:45, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:05,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [41:55<47:45, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:05,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [41:55<47:45, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:05,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [41:55<47:45, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:05,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 431/892 [42:01<47:17, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:11,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 431/892 [42:01<47:17, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:11,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 431/892 [42:01<47:17, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:11,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 431/892 [42:01<47:17, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:11,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 432/892 [42:07<46:40, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 432/892 [42:07<46:40, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 432/892 [42:07<46:40, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 432/892 [42:07<46:40, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:17,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▎ | 433/892 [42:13<46:17, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▎ | 433/892 [42:13<46:17, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:28,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:28,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9024, 'learning_rate': 0.00025919999999999996, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:32,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:32,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 435/892 [42:25<44:54, 5.90s/it]g-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 435/892 [42:25<44:54, 5.90s/it]g-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:37,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:37,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 436/892 [42:30<44:05, 5.80s/it]g-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:42,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:44,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:44,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8932, 'learning_rate': 0.000261, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:48,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:48,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▊ | 438/892 [42:41<42:25, 5.61s/it]g-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:52,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:52,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:52,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:23,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▊ | 439/892 [42:47<41:24, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:59,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:24:59,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▉ | 440/892 [42:52<40:17, 5.35s/it]g-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:02,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:05,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:05,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9899, 'learning_rate': 0.00026339999999999995, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:08,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:08,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:24:56,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▏ | 442/892 [43:01<37:18, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:10,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:12,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:10,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:12,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:10,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▏ | 443/892 [43:05<35:25, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:15,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:16,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:15,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:16,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:15,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▎ | 444/892 [43:09<33:33, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:18,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:20,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:18,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:20,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:18,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 445/892 [43:13<31:37, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:22,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 445/892 [43:13<31:37, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:22,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 446/892 [43:16<29:24, 3.96s/it]g-point operations will not be computed-02 12:25:22,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:27,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:25,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:27,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:25,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 447/892 [43:19<27:03, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:28,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 447/892 [43:19<27:03, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:28,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▋ | 448/892 [43:21<24:43, 3.34s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:31,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▋ | 448/892 [43:21<24:43, 3.34s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:31,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 449/892 [43:24<22:19, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:33,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [43:26<21:16, 2.89s/it]g-point operations will not be computed-02 12:25:33,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [43:26<21:16, 2.89s/it]g-point operations will not be computed-02 12:25:33,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [43:26<21:16, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:37,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [43:26<21:16, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:37,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:40,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:37,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:40,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:37,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [43:34<31:30, 4.29s/it]g-point operations will not be computed-02 12:25:37,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [43:34<31:30, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:44,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [43:34<31:30, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:44,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:48,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:44,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:25:48,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:25:44,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 452/892 [43:41<37:42, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 452/892 [43:41<37:42, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 452/892 [43:41<37:42, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 452/892 [43:41<37:42, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [43:48<41:57, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [43:48<41:57, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [43:48<41:57, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [43:48<41:57, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [43:48<41:57, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:25:51,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [43:55<44:43, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [43:55<44:43, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [43:55<44:43, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [43:55<44:43, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [44:02<46:24, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [44:02<46:24, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:26:16,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 456/892 [44:09<47:37, 6.55s/it]g-point operations will not be computed-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 456/892 [44:09<47:37, 6.55s/it]g-point operations will not be computed-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.711, 'learning_rate': 0.0002724, 'epoch': 0.51} + 51%|█████████████████████████████████████████▍ | 456/892 [44:09<47:37, 6.55s/it]g-point operations will not be computed-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 456/892 [44:09<47:37, 6.55s/it]g-point operations will not be computed-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 456/892 [44:09<47:37, 6.55s/it]g-point operations will not be computed-02 12:26:05,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:16<48:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:16<48:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:16<48:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▌ | 458/892 [44:23<48:36, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▌ | 458/892 [44:23<48:36, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7766, 'learning_rate': 0.0002736, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-02 12:26:36,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [44:30<49:01, 6.79s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [44:30<49:01, 6.79s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7893, 'learning_rate': 0.0002742, 'epoch': 0.51} + 51%|█████████████████████████████████████████▋ | 459/892 [44:30<49:01, 6.79s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [44:30<49:01, 6.79s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [44:30<49:01, 6.79s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 460/892 [44:37<49:00, 6.81s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:26:49,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:26:49,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 461/892 [44:44<48:57, 6.82s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 461/892 [44:44<48:57, 6.82s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5892, 'learning_rate': 0.00027539999999999997, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-02 12:26:57,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [44:50<48:41, 6.80s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [44:50<48:41, 6.80s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9282, 'learning_rate': 0.000276, 'epoch': 0.52} + 52%|█████████████████████████████████████████▉ | 462/892 [44:50<48:41, 6.80s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [44:50<48:41, 6.80s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [44:50<48:41, 6.80s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 463/892 [44:57<48:16, 6.75s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:09,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:09,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▏ | 464/892 [45:04<47:58, 6.73s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▏ | 464/892 [45:04<47:58, 6.73s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:15,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:15,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▏ | 465/892 [45:10<47:45, 6.71s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▏ | 465/892 [45:10<47:45, 6.71s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5684, 'learning_rate': 0.0002778, 'epoch': 0.52} + 52%|██████████████████████████████████████████▏ | 465/892 [45:10<47:45, 6.71s/it]g-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:25,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:25,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0256, 'learning_rate': 0.0002784, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:25,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:25,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:25,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:26:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 467/892 [45:23<46:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 467/892 [45:23<46:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 467/892 [45:23<46:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 467/892 [45:23<46:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 468/892 [45:30<46:25, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:41,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:41,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 469/892 [45:36<46:16, 6.56s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 469/892 [45:36<46:16, 6.56s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:48,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:48,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▋ | 470/892 [45:43<45:55, 6.53s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▋ | 470/892 [45:43<45:55, 6.53s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5782, 'learning_rate': 0.0002808, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-02 12:27:56,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 471/892 [45:49<45:35, 6.50s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 471/892 [45:49<45:35, 6.50s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.492, 'learning_rate': 0.00028139999999999996, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:02,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [45:56<45:09, 6.45s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [45:56<45:09, 6.45s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6235, 'learning_rate': 0.00028199999999999997, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:09,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▉ | 473/892 [46:02<44:36, 6.39s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▉ | 473/892 [46:02<44:36, 6.39s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0461, 'learning_rate': 0.0002826, 'epoch': 0.53} + 53%|██████████████████████████████████████████▉ | 473/892 [46:02<44:36, 6.39s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:16,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:16,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8847, 'learning_rate': 0.00028319999999999994, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:16,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:16,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 475/892 [46:15<44:48, 6.45s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 475/892 [46:15<44:48, 6.45s/it]g-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:27:33,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 476/892 [46:21<44:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:31,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 476/892 [46:21<44:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:31,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1263, 'learning_rate': 0.0002844, 'epoch': 0.53} + 53%|███████████████████████████████████████████▏ | 476/892 [46:21<44:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:31,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▎ | 477/892 [46:27<43:22, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:37,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▎ | 477/892 [46:27<43:22, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:37,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1252, 'learning_rate': 0.000285, 'epoch': 0.53} + 53%|███████████████████████████████████████████▎ | 477/892 [46:27<43:22, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:37,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 478/892 [46:33<42:41, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:43,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 478/892 [46:33<42:41, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:43,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7088, 'learning_rate': 0.00028559999999999995, 'epoch': 0.54} + 54%|███████████████████████████████████████████▍ | 478/892 [46:33<42:41, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:43,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 478/892 [46:33<42:41, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:43,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 479/892 [46:39<42:08, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 479/892 [46:39<42:08, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:53,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:53,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:53,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7786, 'learning_rate': 0.0002868, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:59,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:59,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6808, 'learning_rate': 0.00028739999999999994, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:59,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:28:59,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:05,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:05,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:09,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:09,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 483/892 [47:02<39:52, 5.85s/it]g-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:13,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:28:49,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▉ | 484/892 [47:08<39:12, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:20,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [47:13<38:32, 5.68s/it]g-point operations will not be computed-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [47:13<38:32, 5.68s/it]g-point operations will not be computed-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:24,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:24,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:24,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:18,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████▏ | 486/892 [47:19<38:02, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████▏ | 486/892 [47:19<38:02, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:32,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:32,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7896, 'learning_rate': 0.00029099999999999997, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:36,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:36,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▎ | 488/892 [47:29<36:34, 5.43s/it]g-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:40,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:43,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:43,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9277, 'learning_rate': 0.00029219999999999995, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:46,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:46,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:29,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▍ | 490/892 [47:39<34:26, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:51,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 491/892 [47:44<33:01, 4.94s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 491/892 [47:44<33:01, 4.94s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:54,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:56,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:56,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:29:58,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:00,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:00,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:02,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:02,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:04,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:07,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:07,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:09,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:09,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:10,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:13,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:13,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:15,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:15,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:17,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:17,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:18,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-02 12:30:18,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2369] 2022-03-02 12:30:20,605 >> Batch size = 8aluation *****e number of tokens of the input, floating-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 0/331 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 2/331 [00:02<06:12, 1.13s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 3/331 [00:04<08:27, 1.55s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 4/331 [00:06<09:40, 1.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 5/331 [00:09<11:05, 2.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 6/331 [00:11<12:12, 2.25s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 7/331 [00:14<12:27, 2.31s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|██ | 8/331 [00:16<12:56, 2.41s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 9/331 [00:19<13:27, 2.51s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 10/331 [00:22<14:16, 2.67s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 11/331 [00:24<13:48, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 12/331 [00:27<13:40, 2.57s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 13/331 [00:30<13:30, 2.55s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 14/331 [00:32<13:24, 2.54s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 15/331 [00:35<14:37, 2.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 15/331 [00:35<14:37, 2.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 15/331 [00:35<14:37, 2.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 17/331 [00:42<15:37, 2.99s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 18/331 [00:44<14:20, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 19/331 [00:47<14:04, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 20/331 [00:49<13:07, 2.53s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████▏ | 21/331 [00:52<13:36, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 22/331 [00:55<14:42, 2.86s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 22/331 [00:55<14:42, 2.86s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 22/331 [00:55<14:42, 2.86s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 24/331 [01:03<17:05, 3.34s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 25/331 [01:05<16:21, 3.21s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 26/331 [01:08<15:09, 2.98s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 27/331 [01:11<15:11, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▉ | 28/331 [01:14<14:45, 2.92s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 29/331 [01:16<14:23, 2.86s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 30/331 [01:19<13:44, 2.74s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▋ | 31/331 [01:21<13:07, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 32/331 [01:24<12:46, 2.56s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▏ | 33/331 [01:26<12:46, 2.57s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▍ | 34/331 [01:29<12:46, 2.58s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 35/331 [01:32<12:55, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▉ | 36/331 [01:35<13:35, 2.76s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 37/331 [01:38<14:15, 2.91s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▍ | 38/331 [01:41<14:26, 2.96s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 39/331 [01:44<14:27, 2.97s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▉ | 40/331 [01:46<13:20, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|██████████▏ | 41/331 [01:49<12:46, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 42/331 [01:52<13:41, 2.84s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 43/331 [01:55<14:25, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▉ | 44/331 [01:59<14:52, 3.11s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 45/331 [02:01<14:01, 2.94s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 46/331 [02:03<12:58, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▋ | 47/331 [02:06<12:06, 2.56s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▉ | 48/331 [02:08<12:23, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 49/331 [02:11<12:56, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▍ | 50/331 [02:14<12:52, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▋ | 51/331 [02:17<13:13, 2.83s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 52/331 [02:20<12:43, 2.74s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▏ | 53/331 [02:23<12:44, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▍ | 54/331 [02:25<12:04, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 55/331 [02:28<13:04, 2.84s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 56/331 [02:31<12:50, 2.80s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|██████████████ | 57/331 [02:33<12:24, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 58/331 [02:37<12:58, 2.85s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 59/331 [02:39<12:10, 2.69s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▊ | 60/331 [02:41<11:55, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|███████████████ | 61/331 [02:44<12:14, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 62/331 [02:47<12:09, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▌ | 63/331 [02:51<13:15, 2.97s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▊ | 64/331 [02:53<12:45, 2.87s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 65/331 [02:56<12:36, 2.84s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████▎ | 66/331 [03:00<13:53, 3.15s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████▌ | 67/331 [03:03<14:24, 3.27s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▊ | 68/331 [03:07<14:27, 3.30s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████ | 69/331 [03:10<14:05, 3.23s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▎ | 70/331 [03:13<13:50, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▌ | 71/331 [03:16<13:53, 3.21s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▊ | 72/331 [03:19<13:51, 3.21s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████ | 73/331 [03:22<13:26, 3.13s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▎ | 74/331 [03:25<13:07, 3.06s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▌ | 75/331 [03:28<13:14, 3.11s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▊ | 76/331 [03:31<12:32, 2.95s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|███████████████████ | 77/331 [03:34<12:17, 2.90s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 78/331 [03:36<11:49, 2.80s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▌ | 79/331 [03:39<11:26, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▊ | 80/331 [03:42<11:13, 2.68s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|████████████████████ | 81/331 [03:45<11:38, 2.79s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████▎ | 82/331 [03:47<11:20, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████▌ | 83/331 [03:50<11:42, 2.83s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████▊ | 84/331 [03:54<12:30, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|█████████████████████ | 85/331 [03:56<11:35, 2.83s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|█████████████████████▎ | 86/331 [04:00<12:19, 3.02s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|█████████████████████▌ | 87/331 [04:02<11:57, 2.94s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▊ | 88/331 [04:05<11:39, 2.88s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████ | 89/331 [04:07<10:49, 2.68s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▎ | 90/331 [04:10<10:17, 2.56s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▌ | 91/331 [04:13<10:44, 2.69s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▊ | 92/331 [04:15<10:05, 2.53s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|███████████████████████ | 93/331 [04:17<10:07, 2.55s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|███████████████████████▎ | 94/331 [04:20<10:24, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▌ | 95/331 [04:23<10:27, 2.66s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▊ | 96/331 [04:26<10:34, 2.70s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|████████████████████████ | 97/331 [04:28<10:08, 2.60s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████▎ | 98/331 [04:31<10:29, 2.70s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████▌ | 99/331 [04:34<10:27, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████▍ | 100/331 [04:36<10:02, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 101/331 [04:39<10:00, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▉ | 102/331 [04:42<10:45, 2.82s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|█████████████████████████▏ | 103/331 [04:44<10:13, 2.69s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|█████████████████████████▍ | 104/331 [04:47<10:08, 2.68s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▋ | 105/331 [04:50<10:13, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 106/331 [04:53<10:12, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 107/331 [04:55<09:30, 2.55s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▍ | 108/331 [04:57<09:20, 2.51s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 109/331 [05:00<09:14, 2.50s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 110/331 [05:03<09:42, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 111/331 [05:05<09:47, 2.67s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 112/331 [05:08<09:51, 2.70s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▋ | 113/331 [05:10<09:26, 2.60s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▉ | 114/331 [05:13<09:29, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|████████████████████████████▏ | 115/331 [05:16<09:27, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|████████████████████████████▍ | 116/331 [05:19<09:44, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|████████████████████████████▋ | 117/331 [05:21<09:38, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▉ | 118/331 [05:24<09:19, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████ | 119/331 [05:26<09:16, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▎ | 120/331 [05:29<09:11, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▌ | 121/331 [05:32<09:38, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▊ | 122/331 [05:35<09:28, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████ | 123/331 [05:38<10:08, 2.93s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▎ | 124/331 [05:41<10:01, 2.91s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 125/331 [05:44<10:34, 3.08s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▊ | 126/331 [05:48<10:33, 3.09s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|███████████████████████████████ | 127/331 [05:51<10:58, 3.23s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▎ | 128/331 [05:54<10:59, 3.25s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 129/331 [05:58<10:44, 3.19s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 130/331 [06:01<10:52, 3.25s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 131/331 [06:04<11:04, 3.32s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 132/331 [06:07<10:29, 3.17s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 133/331 [06:10<09:50, 2.98s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▊ | 134/331 [06:13<09:34, 2.92s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 135/331 [06:16<09:46, 2.99s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▎ | 136/331 [06:19<09:58, 3.07s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 137/331 [06:22<10:15, 3.17s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 138/331 [06:26<10:27, 3.25s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████ | 139/331 [06:28<09:21, 2.93s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 140/331 [06:32<09:58, 3.13s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 141/331 [06:34<09:27, 2.99s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▋ | 142/331 [06:37<09:09, 2.91s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▉ | 143/331 [06:40<09:31, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▏ | 144/331 [06:43<09:06, 2.92s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▍ | 145/331 [06:46<08:58, 2.90s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▋ | 146/331 [06:49<09:27, 3.07s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▉ | 147/331 [06:52<09:05, 2.96s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▏ | 148/331 [06:54<08:29, 2.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▍ | 149/331 [06:57<07:59, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▋ | 150/331 [07:00<08:18, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 151/331 [07:02<08:08, 2.72s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 152/331 [07:05<07:49, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 153/331 [07:07<07:44, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 153/331 [07:07<07:44, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 153/331 [07:07<07:44, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▉ | 155/331 [07:14<08:28, 2.89s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 156/331 [07:17<08:44, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 157/331 [07:20<09:02, 3.12s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▋ | 158/331 [07:23<09:09, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▉ | 159/331 [07:27<09:14, 3.23s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 160/331 [07:30<08:45, 3.07s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▍ | 161/331 [07:32<08:27, 2.98s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▋ | 162/331 [07:36<08:51, 3.14s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▉ | 163/331 [07:39<08:54, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▏ | 164/331 [07:42<08:26, 3.03s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 165/331 [07:45<08:11, 2.96s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 166/331 [07:47<08:02, 2.92s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 167/331 [07:51<08:10, 2.99s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 168/331 [07:53<07:43, 2.84s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 169/331 [07:56<07:48, 2.89s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▌ | 170/331 [07:58<07:22, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 171/331 [08:01<07:20, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 172/331 [08:04<06:58, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 173/331 [08:07<07:11, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 174/331 [08:09<06:51, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 175/331 [08:12<06:54, 2.66s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████ | 176/331 [08:14<06:40, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▎ | 177/331 [08:17<07:03, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▌ | 178/331 [08:21<07:30, 2.95s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 179/331 [08:24<07:56, 3.13s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 180/331 [08:27<07:46, 3.09s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▎ | 181/331 [08:30<07:40, 3.07s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 182/331 [08:32<07:00, 2.82s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▊ | 183/331 [08:35<06:26, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████ | 184/331 [08:37<05:58, 2.44s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▎ | 185/331 [08:39<05:37, 2.31s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▌ | 186/331 [08:41<05:45, 2.39s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▊ | 187/331 [08:44<06:15, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████ | 188/331 [08:47<06:15, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▎ | 189/331 [08:49<05:58, 2.52s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▍ | 190/331 [08:51<05:43, 2.44s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▋ | 191/331 [08:54<05:42, 2.44s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▉ | 192/331 [08:56<05:34, 2.41s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▏ | 193/331 [08:59<06:01, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▍ | 194/331 [09:02<05:40, 2.48s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▋ | 195/331 [09:04<05:31, 2.43s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▉ | 196/331 [09:06<05:35, 2.49s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▏ | 197/331 [09:09<05:52, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▍ | 198/331 [09:12<05:37, 2.53s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 199/331 [09:14<05:41, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 199/331 [09:14<05:41, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 199/331 [09:14<05:41, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 61%|█████████████████████████████████████████████████▏ | 201/331 [09:19<05:17, 2.44s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 61%|█████████████████████████████████████████████████▍ | 202/331 [09:22<05:23, 2.51s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 61%|█████████████████████████████████████████████████▋ | 203/331 [09:24<05:26, 2.55s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|█████████████████████████████████████████████████▉ | 204/331 [09:27<05:47, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▏ | 205/331 [09:30<05:48, 2.77s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▍ | 206/331 [09:33<05:41, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▋ | 207/331 [09:36<05:53, 2.85s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▉ | 208/331 [09:39<05:56, 2.90s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████▏ | 209/331 [09:41<05:28, 2.70s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████▍ | 210/331 [09:44<05:06, 2.54s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▋ | 211/331 [09:46<05:12, 2.60s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▉ | 212/331 [09:49<04:57, 2.50s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████ | 213/331 [09:51<04:57, 2.52s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▎ | 214/331 [09:53<04:40, 2.40s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▌ | 215/331 [09:55<04:28, 2.31s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████��███████████████████████████████████▊ | 216/331 [09:59<04:58, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████ | 217/331 [10:01<04:57, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▎ | 218/331 [10:04<05:10, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▌ | 219/331 [10:07<05:08, 2.76s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▊ | 220/331 [10:09<04:52, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████ | 221/331 [10:12<04:53, 2.67s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▎ | 222/331 [10:14<04:37, 2.55s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▌ | 223/331 [10:17<04:39, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 224/331 [10:20<04:41, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 225/331 [10:23<04:41, 2.65s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▎ | 226/331 [10:26<04:51, 2.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▌ | 227/331 [10:28<04:43, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 228/331 [10:31<04:35, 2.67s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████���███████████████████████ | 229/331 [10:33<04:31, 2.66s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████▎ | 230/331 [10:36<04:22, 2.60s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▌ | 231/331 [10:39<04:29, 2.70s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▊ | 232/331 [10:41<04:22, 2.65s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|█████████████████████████████████████████████████████████ | 233/331 [10:44<04:29, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [10:47<04:14, 2.62s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [10:49<04:03, 2.54s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▊ | 236/331 [10:53<04:28, 2.83s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|█████████████████████████████████████████████████████████▉ | 237/331 [10:56<04:39, 2.97s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [10:59<04:34, 2.96s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [11:02<04:36, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [11:05<04:38, 3.06s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [11:08<04:42, 3.14s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [11:12<04:43, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [11:15<04:43, 3.22s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [11:19<04:49, 3.32s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [11:22<04:37, 3.22s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [11:25<04:45, 3.36s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [11:28<04:33, 3.26s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [11:31<04:13, 3.05s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|████████████████████████████████████████████████████████████▉ | 249/331 [11:33<03:53, 2.85s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [11:36<03:39, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [11:38<03:41, 2.76s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [11:41<03:28, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [11:44<03:36, 2.77s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [11:46<03:28, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [11:49<03:33, 2.81s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [11:52<03:24, 2.73s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [11:55<03:29, 2.83s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [11:57<03:14, 2.67s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [12:00<03:09, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|███████████████████████████████████████████████████████████████▋ | 260/331 [12:03<03:12, 2.71s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [12:05<02:59, 2.56s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|████████████████████████████████████████████████████████████████ | 262/331 [12:08<02:57, 2.58s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [12:11<03:06, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|████████████████████████████████████████████████████████████████▌ | 264/331 [12:13<02:59, 2.68s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [12:16<02:53, 2.63s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|█████████████████████████████████████████████████████████████████ | 266/331 [12:18<02:48, 2.59s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|█████████████████████████████████████████████████████████████████▎ | 267/331 [12:22<02:58, 2.78s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [12:24<02:53, 2.76s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [12:28<03:01, 2.92s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [12:30<02:56, 2.89s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [12:34<02:59, 2.99s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [12:36<02:50, 2.89s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [12:39<02:49, 2.92s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|███████████████████████████████████████████████████████████████████ | 274/331 [12:43<02:54, 3.07s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [12:46<02:54, 3.12s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [12:48<02:42, 2.95s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|███████████████████████████████████████████████████████████████████▊ | 277/331 [12:51<02:35, 2.89s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [12:54<02:29, 2.83s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [12:57<02:38, 3.05s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [13:00<02:31, 2.96s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [13:03<02:31, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [13:06<02:28, 3.03s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [13:10<02:28, 3.10s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [13:13<02:30, 3.21s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [13:17<02:30, 3.27s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [13:20<02:28, 3.30s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▏ | 287/331 [13:24<02:29, 3.39s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [13:27<02:24, 3.36s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [13:30<02:12, 3.16s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|██████████████████████████████████████████████████████████████████████▉ | 290/331 [13:32<02:02, 2.98s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [13:35<01:52, 2.81s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|███████████████████████████████████████████████████████████████████████▍ | 292/331 [13:37<01:47, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [13:40<01:44, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [13:42<01:36, 2.61s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|████████████████████████████████████████████████████████████████████████▏ | 295/331 [13:45<01:31, 2.54s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [13:47<01:26, 2.47s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|████████████████████████████████████████████████████████████████████████▋ | 297/331 [13:50<01:33, 2.76s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|████████████████████████████████████████████████████████████████████████▉ | 298/331 [13:54<01:38, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [13:56<01:32, 2.89s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|█████████████████████████████████████████████████████████████████████████▍ | 300/331 [13:59<01:29, 2.88s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [14:02<01:24, 2.81s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|█████████████████████████████████████████████████████████████████████████▉ | 302/331 [14:05<01:19, 2.75s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [14:07<01:13, 2.64s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [14:10<01:14, 2.74s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [14:13<01:14, 2.86s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▉ | 306/331 [14:17<01:15, 3.03s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [14:20<01:16, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [14:24<01:17, 3.38s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [14:27<01:15, 3.42s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [14:30<01:06, 3.17s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|████████████████████████████████████████████████████████████████████████████ | 311/331 [14:33<01:03, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [14:36<00:56, 2.98s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [14:39<00:52, 2.93s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|████████████████████████████████████████████████████████████████████████████▊ | 314/331 [14:42<00:50, 2.95s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [14:45<00:48, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [14:48<00:45, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|█████████████████████████████████████████████████████████████████████████████▌ | 317/331 [14:51<00:44, 3.18s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|█████████████████████████████████████████████████████████████████████████████▊ | 318/331 [14:54<00:38, 2.98s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [14:56<00:34, 2.85s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [14:59<00:31, 2.90s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [15:02<00:28, 2.86s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [15:05<00:26, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [15:05<00:26, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [15:05<00:26, 3.00s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [15:12<00:21, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|███████████████████████████████████████████████████████████████████████████████▌ | 325/331 [15:15<00:18, 3.04s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████��█████████████████████████████████▊ | 326/331 [15:18<00:15, 3.08s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [15:21<00:12, 3.11s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|████████████████████████████████████████████████████████████████████████████████▎| 328/331 [15:24<00:09, 3.14s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [15:27<00:06, 3.10s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [15:31<00:03, 3.27s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [15:31<00:03, 3.27s/it]g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +03/02/2022 12:45:56 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|configuration_utils.py:438] 2022-03-02 12:45:56,756 >> Configuration saved in ./checkpoint-500/config.json g-point operations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|feature_extraction_utils.py:324] 2022-03-02 12:46:01,751 >> Configuration saved in ./checkpoint-500/preprocessor_config.jsonerations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|feature_extraction_utils.py:324] 2022-03-02 12:46:01,751 >> Configuration saved in ./checkpoint-500/preprocessor_config.jsonerations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|feature_extraction_utils.py:324] 2022-03-02 12:46:01,751 >> Configuration saved in ./checkpoint-500/preprocessor_config.jsonerations will not be computed-02 12:29:49,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +03/02/2022 12:47:32 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220302_114207-c11kvzxa/run-c11kvzxa.wandb']. This may take a bit of time if the files are large.