diff --git "a/wandb/run-20220317_164055-2lyj41rg/files/output.log" "b/wandb/run-20220317_164055-2lyj41rg/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220317_164055-2lyj41rg/files/output.log" @@ -0,0 +1,10278 @@ + + + 0%| | 0/17840 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:01,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:03,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0148, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:05,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 1/17840 [00:08<43:52:40, 8.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:07,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:09,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:11,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2566, 'learning_rate': 1.0000000000000001e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:13,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 2/17840 [00:16<41:41:34, 8.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:16,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:18,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:20,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0838, 'learning_rate': 2.0000000000000002e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 3/17840 [00:25<40:50:58, 8.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:23,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:25,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:27,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1289, 'learning_rate': 2.0000000000000002e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:29,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 4/17840 [00:32<39:17:28, 7.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:31,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:33,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:35,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:36,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9334, 'learning_rate': 3.0000000000000004e-07, 'epoch': 0.01} + 0%| | 5/17840 [00:39<38:31:17, 7.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:38,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:40,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:42,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0595, 'learning_rate': 4.0000000000000003e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:44,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 6/17840 [00:47<38:06:17, 7.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:46,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:48,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:49,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9876, 'learning_rate': 5.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:51,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 7/17840 [00:54<37:40:28, 7.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:53,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:55,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:57,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9236, 'learning_rate': 6.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:59,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 8/17840 [01:02<37:28:34, 7.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:01,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:03,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:04,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1163, 'learning_rate': 7.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:06,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 9/17840 [01:09<37:13:59, 7.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:08,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:10,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:12,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0041, 'learning_rate': 8.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:14,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 10/17840 [01:17<36:57:30, 7.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:15,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:17,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:19,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:21,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 11/17840 [01:24<36:39:31, 7.40s/it] + + 0%| | 11/17840 [01:24<36:39:31, 7.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:23,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:24,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:26,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0752, 'learning_rate': 1.0000000000000002e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:28,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 12/17840 [01:31<36:19:56, 7.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:30,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:32,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:33,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:35,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 13/17840 [01:38<36:08:05, 7.30s/it] + + 0%| | 13/17840 [01:38<36:08:05, 7.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:37,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:39,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:41,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0397, 'learning_rate': 1.2000000000000002e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:42,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 14/17840 [01:45<35:56:53, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:44,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:46,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:48,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:49,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 15/17840 [01:53<35:43:31, 7.22s/it] + + 0%| | 15/17840 [01:53<35:43:31, 7.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:51,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:53,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:55,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0296, 'learning_rate': 1.4000000000000001e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:56,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 16/17840 [02:00<35:23:46, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:58,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:00,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:02,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:04,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 17/17840 [02:07<35:13:56, 7.12s/it] + + 0%| | 17/17840 [02:07<35:13:56, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:05,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:07,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:09,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:10,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1036, 'learning_rate': 1.6000000000000001e-06, 'epoch': 0.02} + 0%| | 18/17840 [02:13<34:52:06, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:12,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:14,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:16,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8681, 'learning_rate': 1.7000000000000002e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:17,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 19/17840 [02:20<34:45:58, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:19,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:21,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:23,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:24,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 20/17840 [02:27<34:33:43, 6.98s/it] + + 0%| | 20/17840 [02:27<34:33:43, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:26,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:28,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:29,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:31,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9155, 'learning_rate': 1.9e-06, 'epoch': 0.02} + 0%| | 21/17840 [02:34<34:14:55, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:33,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:35,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:38,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 22/17840 [02:41<34:11:44, 6.91s/it] + 0%| | 22/17840 [02:41<34:11:44, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:40,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:41,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:43,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:45,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 23/17840 [02:48<33:56:55, 6.86s/it] + + 0%| | 23/17840 [02:48<33:56:55, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:46,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:48,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:50,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:51,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 24/17840 [02:54<33:44:11, 6.82s/it] + + 0%| | 24/17840 [02:54<33:44:11, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:53,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:55,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:56,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:00,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 25/17840 [03:03<36:40:20, 7.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:02,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8781, 'learning_rate': 2.3e-06, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:04,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:05,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:07,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [03:10<35:32:05, 7.18s/it] + 0%| | 26/17840 [03:10<35:32:05, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:09,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:12,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:09,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:12,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:09,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:16<34:28:53, 6.97s/it]g-point operations will not be computed-17 16:44:09,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:16<34:28:53, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:18,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:18,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:23<33:40:45, 6.81s/it]g-point operations will not be computed-17 16:44:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:23<33:40:45, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:21,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:23<33:40:45, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:21,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:23<33:40:45, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:21,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:29<33:06:44, 6.69s/it]g-point operations will not be computed-17 16:44:21,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|��� | 29/17840 [03:29<33:06:44, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:28,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:29<33:06:44, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:28,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:31,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:28,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:31,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:28,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:36<32:43:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:34,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:36<32:43:53, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:34,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:37,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:34,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:37,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:34,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:42<32:19:53, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:41,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:42<32:19:53, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:41,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:44,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:41,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:44,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:41,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:48<31:54:52, 6.45s/it]g-point operations will not be computed-17 16:44:41,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:48<31:54:52, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:47,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:50,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:47,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:50,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:47,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:54<31:32:49, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:53,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:54<31:32:49, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:53,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [04:00<30:49:45, 6.23s/it]g-point operations will not be computed-17 16:44:53,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [04:00<30:49:45, 6.23s/it]g-point operations will not be computed-17 16:44:53,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [04:00<30:49:45, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:59,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [04:00<30:49:45, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:59,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:02,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:59,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:02,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:59,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [04:06<30:15:05, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:05,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [04:06<30:15:05, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:05,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:12<29:49:50, 6.03s/it]g-point operations will not be computed-17 16:45:05,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:12<29:49:50, 6.03s/it]g-point operations will not be computed-17 16:45:05,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:12<29:49:50, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:11,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:13,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:11,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:13,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:11,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:18<29:18:35, 5.93s/it]g-point operations will not be computed-17 16:45:11,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:18<29:18:35, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:16,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:19,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:16,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:19,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:16,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [04:23<28:45:36, 5.82s/it]g-point operations will not be computed-17 16:45:16,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [04:23<28:45:36, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:22,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:29<28:10:42, 5.70s/it]g-point operations will not be computed-17 16:45:22,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:29<28:10:42, 5.70s/it]g-point operations will not be computed-17 16:45:22,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:29<28:10:42, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:27,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:27,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:27,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:34<27:28:40, 5.56s/it]g-point operations will not be computed-17 16:45:27,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:34<27:28:40, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:32,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:35,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:32,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:35,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:32,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:39<26:39:54, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:37,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:39,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:37,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:39,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:37,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:44<25:39:29, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:44,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:48<24:34:50, 4.97s/it]g-point operations will not be computed-17 16:45:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:48<24:34:50, 4.97s/it]g-point operations will not be computed-17 16:45:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:48<24:34:50, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:46,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:52<23:17:34, 4.71s/it]g-point operations will not be computed-17 16:45:46,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:52<23:17:34, 4.71s/it]g-point operations will not be computed-17 16:45:46,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:52,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:50,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:52,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:50,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:56<21:43:34, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:54,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:59<20:01:30, 4.05s/it]g-point operations will not be computed-17 16:45:54,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:59<20:01:30, 4.05s/it]g-point operations will not be computed-17 16:45:54,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:59<20:01:30, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:57,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:59<20:01:30, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:57,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [05:02<18:25:50, 3.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:00,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [05:05<16:44:50, 3.39s/it]g-point operations will not be computed-17 16:46:00,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [05:05<16:44:50, 3.39s/it]g-point operations will not be computed-17 16:46:00,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 49/17840 [05:07<15:17:15, 3.09s/it]g-point operations will not be computed-17 16:46:02,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 49/17840 [05:07<15:17:15, 3.09s/it]g-point operations will not be computed-17 16:46:02,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:06,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:05,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:11<16:43:56, 3.39s/it]g-point operations will not be computed-17 16:46:05,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:11<16:43:56, 3.39s/it]g-point operations will not be computed-17 16:46:05,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:11<16:43:56, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:11<16:43:56, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:14,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:19<23:27:21, 4.75s/it]g-point operations will not be computed-17 16:46:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:19<23:27:21, 4.75s/it]g-point operations will not be computed-17 16:46:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:19<23:27:21, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:18,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:19<23:27:21, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:18,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:22,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:18,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:22,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:18,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:27<27:40:06, 5.60s/it]g-point operations will not be computed-17 16:46:18,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:27<27:40:06, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:26,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:27<27:40:06, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:26,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:29,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:26,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:29,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:26,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:34<30:41:46, 6.21s/it]g-point operations will not be computed-17 16:46:26,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:34<30:41:46, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:33,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:34<30:41:46, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:33,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:42<32:29:01, 6.57s/it]g-point operations will not be computed-17 16:46:33,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:42<32:29:01, 6.57s/it]g-point operations will not be computed-17 16:46:33,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:42<32:29:01, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:42<32:29:01, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:44,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:49<33:36:19, 6.80s/it]g-point operations will not be computed-17 16:46:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:49<33:36:19, 6.80s/it]g-point operations will not be computed-17 16:46:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:49<33:36:19, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:48,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:49<33:36:19, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:48,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:52,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:48,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:52,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:48,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:57<34:28:43, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:55,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:57<34:28:43, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:55,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:59,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:55,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [06:04<35:04:55, 7.10s/it]g-point operations will not be computed-17 16:46:55,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [06:04<35:04:55, 7.10s/it]g-point operations will not be computed-17 16:46:55,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [06:04<35:04:55, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:03,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [06:04<35:04:55, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:03,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:06,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:03,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [06:11<35:19:53, 7.15s/it]g-point operations will not be computed-17 16:47:03,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [06:11<35:19:53, 7.15s/it]g-point operations will not be computed-17 16:47:03,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [06:11<35:19:53, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:10,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:14,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:10,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:18<35:27:38, 7.18s/it]g-point operations will not be computed-17 16:47:10,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:18<35:27:38, 7.18s/it]g-point operations will not be computed-17 16:47:10,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:18<35:27:38, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:17,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:18<35:27:38, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:17,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:21,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:17,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:26<35:29:00, 7.18s/it]g-point operations will not be computed-17 16:47:17,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:26<35:29:00, 7.18s/it]g-point operations will not be computed-17 16:47:17,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:26<35:29:00, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:24,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:26<35:29:00, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:24,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:33<35:32:28, 7.20s/it]g-point operations will not be computed-17 16:47:24,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:33<35:32:28, 7.20s/it]g-point operations will not be computed-17 16:47:24,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:33<35:32:28, 7.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:32,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:33<35:32:28, 7.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:32,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:35,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:32,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:40<35:22:08, 7.16s/it]g-point operations will not be computed-17 16:47:32,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:40<35:22:08, 7.16s/it]g-point operations will not be computed-17 16:47:32,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:40<35:22:08, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:40<35:22:08, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:47<35:13:03, 7.13s/it]g-point operations will not be computed-17 16:47:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:47<35:13:03, 7.13s/it]g-point operations will not be computed-17 16:47:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:47<35:13:03, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:46,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:47<35:13:03, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:46,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:49,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:46,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:54<35:03:31, 7.10s/it]g-point operations will not be computed-17 16:47:46,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:54<35:03:31, 7.10s/it]g-point operations will not be computed-17 16:47:46,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:54<35:03:31, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:53,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:56,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:53,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [07:01<34:57:51, 7.08s/it]g-point operations will not be computed-17 16:47:53,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [07:01<34:57:51, 7.08s/it]g-point operations will not be computed-17 16:47:53,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [07:01<34:57:51, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:00,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [07:01<34:57:51, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:00,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:03,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:00,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [07:08<34:44:59, 7.04s/it]g-point operations will not be computed-17 16:48:00,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [07:08<34:44:59, 7.04s/it]g-point operations will not be computed-17 16:48:00,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [07:08<34:44:59, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:07,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:10,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:07,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [07:15<34:38:46, 7.02s/it]g-point operations will not be computed-17 16:48:07,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [07:15<34:38:46, 7.02s/it]g-point operations will not be computed-17 16:48:07,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [07:15<34:38:46, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:14,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [07:15<34:38:46, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:14,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:22<34:20:55, 6.96s/it]g-point operations will not be computed-17 16:48:14,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:22<34:20:55, 6.96s/it]g-point operations will not be computed-17 16:48:14,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:22<34:20:55, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:20,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:22<34:20:55, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:20,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:24,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:20,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:29<34:11:00, 6.92s/it]g-point operations will not be computed-17 16:48:20,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:29<34:11:00, 6.92s/it]g-point operations will not be computed-17 16:48:20,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:29<34:11:00, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:27,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:31,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:27,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:31,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:27,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:35<34:03:21, 6.90s/it]g-point operations will not be computed-17 16:48:27,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:35<34:03:21, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:34,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:38,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:34,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:38,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:34,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:42<33:55:51, 6.87s/it]g-point operations will not be computed-17 16:48:34,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:42<33:55:51, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:41,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:42<33:55:51, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:41,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:44,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:41,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:44,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:41,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:49<33:48:06, 6.85s/it]g-point operations will not be computed-17 16:48:41,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:49<33:48:06, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:48,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:51,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:48,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:51,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:48,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:56<33:27:02, 6.78s/it]g-point operations will not be computed-17 16:48:48,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:56<33:27:02, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:54,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:58,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:54,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:58,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:54,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [08:02<33:21:22, 6.76s/it]g-point operations will not be computed-17 16:48:54,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [08:02<33:21:22, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:01,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [08:02<33:21:22, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:01,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:04,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:01,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:04,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:01,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [08:11<36:29:35, 7.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [08:11<36:29:35, 7.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:13,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:13,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [08:18<35:19:14, 7.16s/it]g-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:18,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:18,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:18,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:24<34:19:41, 6.96s/it]g-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:24<34:19:41, 6.96s/it]g-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:24<34:19:41, 6.96s/it]g-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:24<34:19:41, 6.96s/it]g-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:28,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:28,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:28,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:28,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:34,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:34,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:34,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:40,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:40,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5051, 'learning_rate': 7.8e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:40,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:40,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:40,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:10,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:50<31:56:12, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:48,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:50<31:56:12, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:48,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:50<31:56:12, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:48,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:50<31:56:12, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:48,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:56<31:23:10, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:56<31:23:10, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:56<31:23:10, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:56<31:23:10, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [09:02<31:00:17, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [09:02<31:00:17, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:05,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:05,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.527, 'learning_rate': 8.200000000000001e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:05,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:11,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:11,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4725, 'learning_rate': 8.3e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:15,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:15,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 86/17840 [09:20<29:30:56, 5.98s/it]g-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 86/17840 [09:20<29:30:56, 5.98s/it]g-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:21,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:21,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 87/17840 [09:25<29:00:25, 5.88s/it]g-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:25,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:25,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:25,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:00,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:31<28:23:06, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:31<28:23:06, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:31<28:23:06, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:33,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:36,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:36,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:36,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:29,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 90/17840 [09:41<27:05:54, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:42,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:42,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 91/17840 [09:46<26:08:03, 5.30s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:45,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:48,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:48,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:50,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:52,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:52,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:54,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:56,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:56,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:58,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:00,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:00,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:02,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:03,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:03,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:06,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:06,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:08,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:11,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:11,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:13,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:16,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:16,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.617, 'learning_rate': 9.800000000000001e-06, 'epoch': 0.11} +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:20,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:20,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:24,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:24,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3614, 'learning_rate': 9.900000000000002e-06, 'epoch': 0.11} +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:24,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:24,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [10:35<28:26:33, 5.77s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [10:35<28:26:33, 5.77s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3876, 'learning_rate': 1e-05, 'epoch': 0.11} + 1%|▍ | 102/17840 [10:35<28:26:33, 5.77s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [10:35<28:26:33, 5.77s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:42<31:00:38, 6.29s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:42<31:00:38, 6.29s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5109, 'learning_rate': 1.0100000000000002e-05, 'epoch': 0.12} + 1%|▍ | 103/17840 [10:42<31:00:38, 6.29s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:47,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:47,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3972, 'learning_rate': 1.02e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:47,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:47,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:57<34:07:49, 6.93s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:57<34:07:49, 6.93s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.236, 'learning_rate': 1.03e-05, 'epoch': 0.12} + 1%|▍ | 105/17840 [10:57<34:07:49, 6.93s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:57<34:07:49, 6.93s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [11:05<34:45:01, 7.05s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [11:05<34:45:01, 7.05s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.477, 'learning_rate': 1.04e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:07,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [11:12<35:05:31, 7.12s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [11:12<35:05:31, 7.12s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4439, 'learning_rate': 1.05e-05, 'epoch': 0.12} + 1%|▍ | 107/17840 [11:12<35:05:31, 7.12s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [11:12<35:05:31, 7.12s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:19<35:20:13, 7.17s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:19<35:20:13, 7.17s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6277, 'learning_rate': 1.06e-05, 'epoch': 0.12} + 1%|▍ | 108/17840 [11:19<35:20:13, 7.17s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:19<35:20:13, 7.17s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:19<35:20:13, 7.17s/it]g-point operations will not be computed-17 16:50:39,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [11:27<35:36:13, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [11:27<35:36:13, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [11:27<35:36:13, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:34<35:36:47, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:34<35:36:47, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3082, 'learning_rate': 1.08e-05, 'epoch': 0.12} + 1%|▍ | 110/17840 [11:34<35:36:47, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:34<35:36:47, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:34<35:36:47, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [11:41<35:26:42, 7.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:42,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:42,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:48<35:18:30, 7.17s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:48<35:18:30, 7.17s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3719, 'learning_rate': 1.1000000000000001e-05, 'epoch': 0.13} + 1%|▍ | 112/17840 [11:48<35:18:30, 7.17s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:48<35:18:30, 7.17s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:48<35:18:30, 7.17s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [11:55<35:06:14, 7.13s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:56,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:56,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [12:02<35:05:14, 7.13s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [12:02<35:05:14, 7.13s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2712, 'learning_rate': 1.1200000000000001e-05, 'epoch': 0.13} + 1%|▍ | 114/17840 [12:02<35:05:14, 7.13s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:06,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:06,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3186, 'learning_rate': 1.13e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:06,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:06,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 116/17840 [12:16<34:40:26, 7.04s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 116/17840 [12:16<34:40:26, 7.04s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.151, 'learning_rate': 1.1400000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:18,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [12:23<34:32:58, 7.02s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [12:23<34:32:58, 7.02s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4425, 'learning_rate': 1.1500000000000002e-05, 'epoch': 0.13} + 1%|▍ | 117/17840 [12:23<34:32:58, 7.02s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [12:23<34:32:58, 7.02s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [12:30<34:17:17, 6.97s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [12:30<34:17:17, 6.97s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:37<34:05:33, 6.93s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:37<34:05:33, 6.93s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4933, 'learning_rate': 1.1700000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:39,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:39,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:44<33:54:57, 6.89s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:44<33:54:57, 6.89s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:44<33:54:57, 6.89s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:47,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:47,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4078, 'learning_rate': 1.19e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:47,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:47,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:47,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 122/17840 [12:57<33:26:32, 6.79s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:57,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:57,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:57,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [13:04<33:15:14, 6.76s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [13:04<33:15:14, 6.76s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [13:04<33:15:14, 6.76s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [13:10<33:03:46, 6.72s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [13:10<33:03:46, 6.72s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4599, 'learning_rate': 1.22e-05, 'epoch': 0.14} + 1%|▌ | 124/17840 [13:10<33:03:46, 6.72s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [13:10<33:03:46, 6.72s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [13:10<33:03:46, 6.72s/it]g-point operations will not be computed-17 16:52:26,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:19<36:11:47, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:19<36:11:47, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:19<36:11:47, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:19<36:11:47, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [13:26<34:58:40, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [13:26<34:58:40, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:28,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:28,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [13:32<34:06:32, 6.93s/it]g-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [13:32<34:06:32, 6.93s/it]g-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:34,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:39<33:22:54, 6.78s/it]g-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:39<33:22:54, 6.78s/it]g-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3651, 'learning_rate': 1.2600000000000001e-05, 'epoch': 0.14} + 1%|▌ | 128/17840 [13:39<33:22:54, 6.78s/it]g-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:42,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:42,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2908, 'learning_rate': 1.27e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:42,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:48,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:48,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5054, 'learning_rate': 1.2800000000000001e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:48,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:48,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:48,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:18,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:58<31:51:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:56,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:58<31:51:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:56,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:58<31:51:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:56,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:58<31:51:42, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:56,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [14:04<31:22:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:02,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [14:04<31:22:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:02,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [14:04<31:22:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:02,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [14:04<31:22:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:02,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [14:10<30:56:43, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [14:10<30:56:43, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:13,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:13,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4504, 'learning_rate': 1.32e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:13,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:19,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:19,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.31, 'learning_rate': 1.3300000000000001e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:23,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [14:27<29:22:44, 5.97s/it]g-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [14:27<29:22:44, 5.97s/it]g-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:27,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:27,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:27,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:08,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [14:33<28:50:11, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [14:33<28:50:11, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:35,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:35,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4361, 'learning_rate': 1.3600000000000002e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:39,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 139/17840 [14:44<27:26:45, 5.58s/it]g-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 139/17840 [14:44<27:26:45, 5.58s/it]g-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:43,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:46,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:46,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2478, 'learning_rate': 1.3800000000000002e-05, 'epoch': 0.16} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:49,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:49,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 141/17840 [14:53<25:19:54, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:54,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 142/17840 [14:58<24:08:20, 4.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 142/17840 [14:58<24:08:20, 4.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:58,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 143/17840 [15:02<22:52:10, 4.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:00,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 143/17840 [15:02<22:52:10, 4.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:00,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:01,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:00,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:01,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:00,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 144/17840 [15:05<21:27:13, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:03,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 145/17840 [15:09<20:00:42, 4.07s/it]g-point operations will not be computed-17 16:56:03,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 145/17840 [15:09<20:00:42, 4.07s/it]g-point operations will not be computed-17 16:56:03,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:08,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:07,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 146/17840 [15:12<18:41:47, 3.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:10,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 146/17840 [15:12<18:41:47, 3.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:10,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 147/17840 [15:15<17:22:48, 3.54s/it]g-point operations will not be computed-17 16:56:10,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 147/17840 [15:15<17:22:48, 3.54s/it]g-point operations will not be computed-17 16:56:10,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:14,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:13,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:14,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:13,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:16,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:15,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 149/17840 [15:20<14:51:19, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 149/17840 [15:20<14:51:19, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:24<16:40:11, 3.39s/it]g-point operations will not be computed-17 16:56:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:24<16:40:11, 3.39s/it]g-point operations will not be computed-17 16:56:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:24<16:40:11, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:23,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:24<16:40:11, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:23,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:27,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:23,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:32<23:16:58, 4.74s/it]g-point operations will not be computed-17 16:56:23,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:32<23:16:58, 4.74s/it]g-point operations will not be computed-17 16:56:23,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:32<23:16:58, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:32<23:16:58, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:32<23:16:58, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 152/17840 [15:40<27:27:33, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 152/17840 [15:40<27:27:33, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3382, 'learning_rate': 1.5e-05, 'epoch': 0.17} + 1%|▋ | 152/17840 [15:40<27:27:33, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:44,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:44,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4166, 'learning_rate': 1.51e-05, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:44,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:44,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:55<32:10:52, 6.55s/it]g-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:55<32:10:52, 6.55s/it]g-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.265, 'learning_rate': 1.52e-05, 'epoch': 0.17} + 1%|▋ | 154/17840 [15:55<32:10:52, 6.55s/it]g-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:55<32:10:52, 6.55s/it]g-point operations will not be computed-17 16:56:31,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [16:02<33:25:14, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [16:02<33:25:14, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2423, 'learning_rate': 1.53e-05, 'epoch': 0.17} + 1%|▋ | 155/17840 [16:02<33:25:14, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [16:09<34:05:23, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [16:09<34:05:23, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2975, 'learning_rate': 1.54e-05, 'epoch': 0.17} + 1%|▋ | 156/17840 [16:09<34:05:23, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [16:09<34:05:23, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [16:09<34:05:23, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:01,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [16:16<34:29:16, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [16:16<34:29:16, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [16:16<34:29:16, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [16:16<34:29:16, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:24<34:46:42, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:24<34:46:42, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:24<34:46:42, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:24<34:46:42, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:24<34:46:42, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [16:31<34:54:11, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [16:31<34:54:11, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:33,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:33,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:38<35:01:54, 7.13s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:38<35:01:54, 7.13s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:38<35:01:54, 7.13s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:38<35:01:54, 7.13s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:38<35:01:54, 7.13s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 161/17840 [16:45<34:50:35, 7.10s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:52<34:37:21, 7.05s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:52<34:37:21, 7.05s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:52<34:37:21, 7.05s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:52<34:37:21, 7.05s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:52<34:37:21, 7.05s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:59<34:29:57, 7.03s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:59,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:59,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:59,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [17:06<34:22:58, 7.00s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [17:06<34:22:58, 7.00s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [17:06<34:22:58, 7.00s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:10,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:10,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4037, 'learning_rate': 1.63e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:10,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:10,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:10,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [17:20<34:01:17, 6.93s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:20,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:20,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:20,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [17:26<33:53:50, 6.90s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [17:26<33:53:50, 6.90s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:29,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [17:33<33:46:49, 6.88s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [17:33<33:46:49, 6.88s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1465, 'learning_rate': 1.66e-05, 'epoch': 0.19} + 1%|▋ | 168/17840 [17:33<33:46:49, 6.88s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [17:33<33:46:49, 6.88s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [17:33<33:46:49, 6.88s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [17:40<33:32:17, 6.83s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:40,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:40,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:40,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [17:47<33:26:08, 6.81s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [17:47<33:26:08, 6.81s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:49,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:53<33:15:04, 6.77s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:53<33:15:04, 6.77s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5178, 'learning_rate': 1.69e-05, 'epoch': 0.19} + 1%|▋ | 171/17840 [17:53<33:15:04, 6.77s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:57,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:57,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4713, 'learning_rate': 1.7000000000000003e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:57,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:57,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:57,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [18:07<32:52:33, 6.70s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [18:07<32:52:33, 6.70s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:09,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:09,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [18:13<32:39:19, 6.65s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [18:13<32:39:19, 6.65s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:15,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [18:22<35:51:39, 7.31s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [18:22<35:51:39, 7.31s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3283, 'learning_rate': 1.73e-05, 'epoch': 0.2} + 1%|▋ | 175/17840 [18:22<35:51:39, 7.31s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [18:22<35:51:39, 7.31s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [18:22<35:51:39, 7.31s/it]g-point operations will not be computed-17 16:57:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [18:29<34:52:48, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [18:29<34:52:48, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [18:29<34:52:48, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [18:29<34:52:48, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [18:35<33:48:59, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:35,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:35,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:35,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 178/17840 [18:42<33:01:08, 6.73s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:42,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:42,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:42,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [18:48<32:16:59, 6.58s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [18:48<32:16:59, 6.58s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:49,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:49,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [18:54<31:44:02, 6.47s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [18:54<31:44:02, 6.47s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:56,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:56,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [19:00<31:14:17, 6.37s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [19:00<31:14:17, 6.37s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:02,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:02,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [19:06<30:55:34, 6.31s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [19:06<30:55:34, 6.31s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:08,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:08,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [19:12<30:34:38, 6.23s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:12,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:12,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:12,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [19:18<30:03:05, 6.13s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:18,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:18,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:18,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [19:24<29:31:19, 6.02s/it]g-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:24,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:24,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:24,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:59:27,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 186/17840 [19:30<28:57:57, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 186/17840 [19:30<28:57:57, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:32,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:32,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5196, 'learning_rate': 1.85e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:36,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:36,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 188/17840 [19:41<28:04:54, 5.73s/it]g-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:40,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:43,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:43,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3254, 'learning_rate': 1.87e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:47,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 190/17840 [19:51<26:49:19, 5.47s/it]g-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 190/17840 [19:51<26:49:19, 5.47s/it]g-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:51,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:53,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:53,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4484, 'learning_rate': 1.8900000000000002e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:57,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:57,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 192/17840 [20:01<25:00:06, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:01,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 193/17840 [20:05<23:58:01, 4.89s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 193/17840 [20:05<23:58:01, 4.89s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:04,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:06,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:06,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:08,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:08,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:10,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:12,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:12,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:15,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:16,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:16,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:19,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:19,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:21,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:21,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:22,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:25,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:25,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.778, 'learning_rate': 1.9800000000000004e-05, 'epoch': 0.22} +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:29,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:29,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:33,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:33,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1823, 'learning_rate': 1.9900000000000003e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:37,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:37,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:44<27:27:36, 5.60s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:44<27:27:36, 5.60s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3117, 'learning_rate': 2e-05, 'epoch': 0.23} + 1%|▊ | 202/17840 [20:44<27:27:36, 5.60s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:44<27:27:36, 5.60s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [20:51<30:25:56, 6.21s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [20:51<30:25:56, 6.21s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1939, 'learning_rate': 2.01e-05, 'epoch': 0.23} + 1%|▊ | 203/17840 [20:51<30:25:56, 6.21s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:56,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:56,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.241, 'learning_rate': 2.0200000000000003e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:56,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:56,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [21:06<33:25:10, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [21:06<33:25:10, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1395, 'learning_rate': 2.0300000000000002e-05, 'epoch': 0.23} + 1%|▊ | 205/17840 [21:06<33:25:10, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [21:06<33:25:10, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [21:14<34:15:11, 6.99s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [21:14<34:15:11, 6.99s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1591, 'learning_rate': 2.04e-05, 'epoch': 0.23} + 1%|▉ | 206/17840 [21:14<34:15:11, 6.99s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:18,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:18,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2205, 'learning_rate': 2.05e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:18,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:18,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [21:28<35:03:57, 7.16s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [21:28<35:03:57, 7.16s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1156, 'learning_rate': 2.06e-05, 'epoch': 0.23} + 1%|▉ | 208/17840 [21:28<35:03:57, 7.16s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:32,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:32,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3496, 'learning_rate': 2.07e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:32,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:32,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [21:43<35:14:09, 7.20s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [21:43<35:14:09, 7.20s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2672, 'learning_rate': 2.08e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:45,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [21:50<35:05:47, 7.17s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [21:50<35:05:47, 7.17s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2128, 'learning_rate': 2.09e-05, 'epoch': 0.24} + 1%|▉ | 211/17840 [21:50<35:05:47, 7.17s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [21:50<35:05:47, 7.17s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 212/17840 [21:57<35:03:13, 7.16s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 212/17840 [21:57<35:03:13, 7.16s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3622, 'learning_rate': 2.1e-05, 'epoch': 0.24} + 1%|▉ | 212/17840 [21:57<35:03:13, 7.16s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3001, 'learning_rate': 2.11e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [22:11<34:45:58, 7.10s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [22:11<34:45:58, 7.10s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3397, 'learning_rate': 2.12e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:13,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:13,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [22:18<34:27:04, 7.04s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [22:18<34:27:04, 7.04s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [22:18<34:27:04, 7.04s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [22:18<34:27:04, 7.04s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [22:25<34:28:57, 7.04s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [22:25<34:28:57, 7.04s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:25,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:25,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 217/17840 [22:32<34:20:09, 7.01s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 217/17840 [22:32<34:20:09, 7.01s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3529, 'learning_rate': 2.15e-05, 'epoch': 0.24} + 1%|▉ | 217/17840 [22:32<34:20:09, 7.01s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:36,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:36,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:36,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2741, 'learning_rate': 2.16e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:36,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [22:46<34:06:27, 6.97s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [22:46<34:06:27, 6.97s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3483, 'learning_rate': 2.1700000000000002e-05, 'epoch': 0.25} + 1%|▉ | 219/17840 [22:46<34:06:27, 6.97s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [22:46<34:06:27, 6.97s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:50,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:50,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:50,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:50,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:50,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [23:00<33:47:13, 6.90s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:00,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:00,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:00,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [23:06<33:34:35, 6.86s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [23:06<33:34:35, 6.86s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:08,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:08,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [23:13<33:21:48, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [23:13<33:21:48, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [23:13<33:21:48, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [23:13<33:21:48, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [23:13<33:21:48, 6.82s/it]g-point operations will not be computed-17 17:00:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:20<33:03:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:20<33:03:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:20<33:03:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:20<33:03:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [23:29<36:21:56, 7.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [23:29<36:21:56, 7.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:31,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:31,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [23:35<35:05:46, 7.17s/it]g-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [23:35<35:05:46, 7.17s/it]g-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [23:35<35:05:46, 7.17s/it]g-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:39,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:39,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3265, 'learning_rate': 2.25e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:39,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2261, 'learning_rate': 2.26e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 229/17840 [23:54<32:22:24, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 229/17840 [23:54<32:22:24, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:57,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:57,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3269, 'learning_rate': 2.2800000000000002e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:57,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2721, 'learning_rate': 2.29e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 232/17840 [24:13<31:01:23, 6.34s/it]g-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:13,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:13,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:13,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:53,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [24:19<30:29:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:17,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [24:19<30:29:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:17,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [24:19<30:29:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:17,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [24:19<30:29:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:17,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 234/17840 [24:25<29:59:48, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 234/17840 [24:25<29:59:48, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:27,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:27,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4523, 'learning_rate': 2.3300000000000004e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:32,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:32,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 236/17840 [24:36<29:00:42, 5.93s/it]g-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:36,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:36,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:36,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [24:42<28:28:23, 5.82s/it]g-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:42,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:44,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:44,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5609, 'learning_rate': 2.36e-05, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:48,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:48,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [24:53<27:23:03, 5.60s/it]g-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:52,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:52,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:52,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:23,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 240/17840 [24:58<26:40:24, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:58,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:58,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 241/17840 [25:03<25:53:49, 5.30s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:02,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:04,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:04,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:06,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:08,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:08,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:10,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:12,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:12,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:14,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:14,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:16,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:19,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:19,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:21,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:21,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:22,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:24,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:24,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:27,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:27,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:28,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:31,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:31,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3225, 'learning_rate': 2.48e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:35,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:35,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:39,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:39,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.51, 'learning_rate': 2.4900000000000002e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:43,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:43,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:50<27:15:14, 5.58s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:50<27:15:14, 5.58s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1788, 'learning_rate': 2.5e-05, 'epoch': 0.28} + 1%|█ | 252/17840 [25:50<27:15:14, 5.58s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:50<27:15:14, 5.58s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:50<27:15:14, 5.58s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [25:57<29:58:28, 6.14s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [25:57<29:58:28, 6.14s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:59,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [26:04<31:41:49, 6.49s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [26:04<31:41:49, 6.49s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3818, 'learning_rate': 2.5200000000000003e-05, 'epoch': 0.28} + 1%|█ | 254/17840 [26:04<31:41:49, 6.49s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [26:04<31:41:49, 6.49s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [26:12<32:52:45, 6.73s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [26:12<32:52:45, 6.73s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2213, 'learning_rate': 2.5300000000000002e-05, 'epoch': 0.29} + 1%|█ | 255/17840 [26:12<32:52:45, 6.73s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.242, 'learning_rate': 2.54e-05, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [26:26<34:08:43, 6.99s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [26:26<34:08:43, 6.99s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3769, 'learning_rate': 2.5500000000000003e-05, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:28,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [26:33<34:25:27, 7.05s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [26:33<34:25:27, 7.05s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.23, 'learning_rate': 2.5600000000000002e-05, 'epoch': 0.29} + 1%|█ | 258/17840 [26:33<34:25:27, 7.05s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 258/17840 [26:33<34:25:27, 7.05s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [26:40<34:33:40, 7.08s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [26:40<34:33:40, 7.08s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2235, 'learning_rate': 2.57e-05, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:43,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:48<34:40:29, 7.10s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:48<34:40:29, 7.10s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3889, 'learning_rate': 2.58e-05, 'epoch': 0.29} + 1%|█ | 260/17840 [26:48<34:40:29, 7.10s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:48<34:40:29, 7.10s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 261/17840 [26:55<34:34:30, 7.08s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 261/17840 [26:55<34:34:30, 7.08s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3944, 'learning_rate': 2.5900000000000003e-05, 'epoch': 0.29} + 1%|█ | 261/17840 [26:55<34:34:30, 7.08s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:58,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:58,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1359, 'learning_rate': 2.6000000000000002e-05, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:58,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:58,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:58,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [27:08<34:14:38, 7.01s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:09,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:09,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 264/17840 [27:15<34:07:45, 6.99s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 264/17840 [27:15<34:07:45, 6.99s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.229, 'learning_rate': 2.6200000000000003e-05, 'epoch': 0.3} + 1%|█ | 264/17840 [27:15<34:07:45, 6.99s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:19,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:19,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3339, 'learning_rate': 2.6300000000000002e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:19,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:19,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [27:29<34:01:56, 6.97s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [27:29<34:01:56, 6.97s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3954, 'learning_rate': 2.64e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:31,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [27:36<33:50:04, 6.93s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [27:36<33:50:04, 6.93s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2459, 'learning_rate': 2.6500000000000004e-05, 'epoch': 0.3} + 1%|█▏ | 267/17840 [27:36<33:50:04, 6.93s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [27:36<33:50:04, 6.93s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [27:36<33:50:04, 6.93s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [27:43<33:46:50, 6.92s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:43,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:43,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:43,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:50<33:31:39, 6.87s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:50<33:31:39, 6.87s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:50<33:31:39, 6.87s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:50<33:31:39, 6.87s/it]g-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:53,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:53,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:53,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:53,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:53,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:56,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [28:03<33:10:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [28:03<33:10:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [28:03<33:10:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [28:03<33:10:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [28:10<32:55:30, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 273/17840 [28:16<32:35:08, 6.68s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:17,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:17,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [28:23<32:30:02, 6.66s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [28:23<32:30:02, 6.66s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1669, 'learning_rate': 2.7200000000000004e-05, 'epoch': 0.31} + 2%|█▏ | 274/17840 [28:23<32:30:02, 6.66s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [28:23<32:30:02, 6.66s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [28:23<32:30:02, 6.66s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [28:32<35:52:35, 7.35s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:32,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:32,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:32,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 276/17840 [28:39<34:39:19, 7.10s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:39,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:39,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:39,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [28:45<33:30:44, 6.87s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:45,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:45,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:45,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [28:51<32:39:57, 6.70s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [28:51<32:39:57, 6.70s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:53,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:53,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [28:57<31:58:49, 6.56s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [28:57<31:58:49, 6.56s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:59,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:59,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [29:04<31:37:16, 6.48s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [29:04<31:37:16, 6.48s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:05,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [29:10<31:28:42, 6.45s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [29:10<31:28:42, 6.45s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1678, 'learning_rate': 2.7900000000000004e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:12,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [29:16<30:54:03, 6.34s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [29:16<30:54:03, 6.34s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3188, 'learning_rate': 2.8000000000000003e-05, 'epoch': 0.32} + 2%|█▏ | 282/17840 [29:16<30:54:03, 6.34s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:19,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:19,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0967, 'learning_rate': 2.8100000000000005e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:23,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:23,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [29:28<29:47:38, 6.11s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [29:28<29:47:38, 6.11s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:29,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:29,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 285/17840 [29:34<29:11:41, 5.99s/it]g-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:33,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:33,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:33,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:02,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 286/17840 [29:39<28:40:55, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 286/17840 [29:39<28:40:55, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:42,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:42,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4427, 'learning_rate': 2.8499999999999998e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:46,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:46,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 288/17840 [29:50<27:23:01, 5.62s/it]g-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:50,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:50,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:50,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 289/17840 [29:55<26:39:46, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:56,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:56,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 290/17840 [30:00<25:50:26, 5.30s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:59,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:02,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:02,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:04,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:06,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:06,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:08,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:10,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:10,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:12,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:14,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:14,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:16,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:17,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:17,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:19,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:19,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:22,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:23,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:23,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:26,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:26,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:28,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:28,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:29,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:32,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:32,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8326, 'learning_rate': 2.98e-05, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:36,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:36,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:40,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:40,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1651, 'learning_rate': 2.9900000000000002e-05, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:44,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:44,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:51<26:46:36, 5.50s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:51<26:46:36, 5.50s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2763, 'learning_rate': 3e-05, 'epoch': 0.34} + 2%|█▎ | 302/17840 [30:51<26:46:36, 5.50s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:51<26:46:36, 5.50s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:51<26:46:36, 5.50s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [30:58<29:42:29, 6.10s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:59,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:59,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [31:06<31:32:54, 6.48s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [31:06<31:32:54, 6.48s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3608, 'learning_rate': 3.02e-05, 'epoch': 0.34} + 2%|█▎ | 304/17840 [31:06<31:32:54, 6.48s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [31:06<31:32:54, 6.48s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [31:06<31:32:54, 6.48s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [31:13<32:39:40, 6.71s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [31:13<32:39:40, 6.71s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:15,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:20<33:33:00, 6.89s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:20<33:33:00, 6.89s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2164, 'learning_rate': 3.04e-05, 'epoch': 0.34} + 2%|█▎ | 306/17840 [31:20<33:33:00, 6.89s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:20<33:33:00, 6.89s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [31:27<33:58:03, 6.97s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [31:27<33:58:03, 6.97s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2648, 'learning_rate': 3.05e-05, 'epoch': 0.34} + 2%|█▎ | 307/17840 [31:27<33:58:03, 6.97s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:31,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:31,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3354, 'learning_rate': 3.06e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:31,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:31,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [31:42<34:22:27, 7.06s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [31:42<34:22:27, 7.06s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2717, 'learning_rate': 3.07e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:44,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [31:49<34:26:24, 7.07s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [31:49<34:26:24, 7.07s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3944, 'learning_rate': 3.08e-05, 'epoch': 0.35} + 2%|█▎ | 310/17840 [31:49<34:26:24, 7.07s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [31:49<34:26:24, 7.07s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [31:56<34:23:35, 7.06s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [31:56<34:23:35, 7.06s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:56,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:56,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 312/17840 [32:03<34:14:06, 7.03s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 312/17840 [32:03<34:14:06, 7.03s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.403, 'learning_rate': 3.1e-05, 'epoch': 0.35} + 2%|█▎ | 312/17840 [32:03<34:14:06, 7.03s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:06,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:06,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2895, 'learning_rate': 3.1100000000000004e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:06,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:06,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [32:16<33:54:16, 6.96s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [32:16<33:54:16, 6.96s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:17,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:17,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [32:23<33:43:27, 6.93s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [32:23<33:43:27, 6.93s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1667, 'learning_rate': 3.13e-05, 'epoch': 0.35} + 2%|█▎ | 315/17840 [32:23<33:43:27, 6.93s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [32:23<33:43:27, 6.93s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [32:23<33:43:27, 6.93s/it]g-point operations will not be computed-17 17:10:53,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:30<33:35:54, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:30<33:35:54, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:30<33:35:54, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 317/17840 [32:37<33:29:34, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 317/17840 [32:37<33:29:34, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1964, 'learning_rate': 3.15e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:39,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [32:44<33:21:54, 6.86s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [32:44<33:21:54, 6.86s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2038, 'learning_rate': 3.16e-05, 'epoch': 0.36} + 2%|█▎ | 318/17840 [32:44<33:21:54, 6.86s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:47,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:47,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:47,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:51,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:51,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [32:57<33:01:24, 6.79s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [32:57<33:01:24, 6.79s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2201, 'learning_rate': 3.18e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:59,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 321/17840 [33:04<32:54:55, 6.76s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 321/17840 [33:04<32:54:55, 6.76s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.36, 'learning_rate': 3.19e-05, 'epoch': 0.36} + 2%|█▎ | 321/17840 [33:04<32:54:55, 6.76s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:07,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:07,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2704, 'learning_rate': 3.2000000000000005e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:07,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:07,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:07,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 323/17840 [33:17<32:36:24, 6.70s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:18,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:18,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:18,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [33:24<32:35:45, 6.70s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [33:24<32:35:45, 6.70s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:26,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:26,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [33:33<35:40:23, 7.33s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [33:33<35:40:23, 7.33s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [33:33<35:40:23, 7.33s/it]g-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4044, 'learning_rate': 3.24e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [33:46<33:41:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [33:46<33:41:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [33:46<33:41:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [33:46<33:41:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [33:52<32:48:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [33:58<32:14:29, 6.63s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 330/17840 [34:05<31:52:59, 6.56s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 330/17840 [34:05<31:52:59, 6.56s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:06,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [34:11<31:27:23, 6.47s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [34:11<31:27:23, 6.47s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:11,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:11,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:11,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [34:17<30:57:17, 6.36s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [34:17<30:57:17, 6.36s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:19,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:19,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 333/17840 [34:23<30:31:23, 6.28s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 333/17840 [34:23<30:31:23, 6.28s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:25,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:25,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 334/17840 [34:29<29:55:44, 6.15s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:29,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:29,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:29,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 335/17840 [34:35<29:29:42, 6.07s/it]g-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:35,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:35,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:35,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:44,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [34:41<28:59:59, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [34:41<28:59:59, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:43,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:43,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1603, 'learning_rate': 3.35e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:47,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:47,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 338/17840 [34:52<27:48:06, 5.72s/it]g-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:51,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:51,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:51,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:39,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 339/17840 [34:57<27:09:06, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:15:55,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:58,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:55,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:58,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:55,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [35:02<26:17:56, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [35:02<26:17:56, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:04,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:04,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:06,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:08,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:08,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:11,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:13,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:13,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:15,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:17,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:17,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:18,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:20,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:20,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:22,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:24,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:24,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:26,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:26,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:28,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:30,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:30,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:32,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:32,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:33,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:36,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:36,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6026, 'learning_rate': 3.48e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:40,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:40,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:44,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:44,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2876, 'learning_rate': 3.49e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:44,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:44,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [35:54<27:13:39, 5.60s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [35:54<27:13:39, 5.60s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:55,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:55,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [36:02<29:51:01, 6.15s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [36:02<29:51:01, 6.15s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2859, 'learning_rate': 3.51e-05, 'epoch': 0.4} + 2%|█▌ | 353/17840 [36:02<29:51:01, 6.15s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [36:02<29:51:01, 6.15s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [36:09<31:36:44, 6.51s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [36:09<31:36:44, 6.51s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2586, 'learning_rate': 3.52e-05, 'epoch': 0.4} + 2%|█▌ | 354/17840 [36:09<31:36:44, 6.51s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [36:09<31:36:44, 6.51s/it]g-point operations will not be computed-17 17:16:00,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3954, 'learning_rate': 3.53e-05, 'epoch': 0.4} + 2%|█▌ | 355/17840 [36:16<32:52:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [36:16<32:52:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [36:16<32:52:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [36:24<33:42:30, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [36:24<33:42:30, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1234, 'learning_rate': 3.54e-05, 'epoch': 0.4} + 2%|█▌ | 356/17840 [36:24<33:42:30, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [36:24<33:42:30, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:15,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [36:31<34:10:31, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [36:31<34:10:31, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2875, 'learning_rate': 3.55e-05, 'epoch': 0.4} + 2%|█▌ | 357/17840 [36:31<34:10:31, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [36:38<34:32:35, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [36:38<34:32:35, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2441, 'learning_rate': 3.56e-05, 'epoch': 0.4} + 2%|█▌ | 358/17840 [36:38<34:32:35, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [36:38<34:32:35, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [36:46<34:43:11, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [36:46<34:43:11, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2892, 'learning_rate': 3.57e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:48,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [36:53<34:42:49, 7.15s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [36:53<34:42:49, 7.15s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4134, 'learning_rate': 3.58e-05, 'epoch': 0.4} + 2%|█▌ | 360/17840 [36:53<34:42:49, 7.15s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [36:53<34:42:49, 7.15s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [37:00<34:27:42, 7.10s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [37:00<34:27:42, 7.10s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2588, 'learning_rate': 3.59e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:02,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [37:07<34:11:48, 7.04s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [37:07<34:11:48, 7.04s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.289, 'learning_rate': 3.6e-05, 'epoch': 0.41} + 2%|█▌ | 362/17840 [37:07<34:11:48, 7.04s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:10,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:10,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:14,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:14,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [37:21<34:06:18, 7.03s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [37:21<34:06:18, 7.03s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3809, 'learning_rate': 3.62e-05, 'epoch': 0.41} + 2%|█▌ | 364/17840 [37:21<34:06:18, 7.03s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:24,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:24,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1343, 'learning_rate': 3.63e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:24,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:24,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [37:34<33:45:16, 6.95s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [37:34<33:45:16, 6.95s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:35,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:35,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [37:41<33:25:31, 6.89s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [37:41<33:25:31, 6.89s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2651, 'learning_rate': 3.65e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:43,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [37:48<33:16:21, 6.86s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [37:48<33:16:21, 6.86s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3019, 'learning_rate': 3.66e-05, 'epoch': 0.41} + 2%|█▌ | 368/17840 [37:48<33:16:21, 6.86s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [37:48<33:16:21, 6.86s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [37:55<33:10:09, 6.83s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [37:55<33:10:09, 6.83s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [38:01<33:08:20, 6.83s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [38:01<33:08:20, 6.83s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3638, 'learning_rate': 3.68e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:03,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:03,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [38:08<33:02:48, 6.81s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [38:08<33:02:48, 6.81s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [38:08<33:02:48, 6.81s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [38:08<33:02:48, 6.81s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [38:08<33:02:48, 6.81s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [38:15<32:51:22, 6.77s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:15,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:15,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:15,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [38:22<32:36:07, 6.72s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:22,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:22,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:22,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [38:28<32:20:05, 6.66s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [38:28<32:20:05, 6.66s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:30,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [38:37<35:27:17, 7.31s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [38:37<35:27:17, 7.31s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1933, 'learning_rate': 3.73e-05, 'epoch': 0.42} + 2%|█▌ | 375/17840 [38:37<35:27:17, 7.31s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [38:37<35:27:17, 7.31s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [38:37<35:27:17, 7.31s/it]g-point operations will not be computed-17 17:17:30,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [38:43<34:21:48, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [38:43<34:21:48, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [38:43<34:21:48, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [38:43<34:21:48, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [38:50<33:28:03, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:50,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:50,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:50,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [38:56<32:40:23, 6.74s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [38:56<32:40:23, 6.74s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:58,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:58,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 379/17840 [39:03<32:07:47, 6.62s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:03,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:03,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:03,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [39:09<31:30:54, 6.50s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:09,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:09,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:09,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [39:15<31:01:04, 6.40s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [39:15<31:01:04, 6.40s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:16,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:16,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [39:21<30:31:25, 6.29s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [39:21<30:31:25, 6.29s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:23,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:23,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [39:27<30:11:00, 6.22s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:27,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:27,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:27,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 384/17840 [39:33<29:38:17, 6.11s/it]g-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:33,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:33,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:33,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:42,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 385/17840 [39:39<29:10:02, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 385/17840 [39:39<29:10:02, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:41,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:41,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2923, 'learning_rate': 3.8400000000000005e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:41,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:47,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:47,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:37,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 388/17840 [39:55<27:38:26, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:54,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 388/17840 [39:55<27:38:26, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:54,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:58,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:54,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:58,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:54,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2472, 'learning_rate': 3.8700000000000006e-05, 'epoch': 0.44} +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:01,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:54,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:01,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:54,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 390/17840 [40:06<26:15:53, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 390/17840 [40:06<26:15:53, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:08,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:08,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:10,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:12,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:12,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1571, 'learning_rate': 3.9000000000000006e-05, 'epoch': 0.44} +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:15,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:15,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:04,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 393/17840 [40:20<23:25:54, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:18,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:20,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:18,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:20,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:18,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 394/17840 [40:24<22:23:38, 4.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:22,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:23,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:22,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:23,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:22,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 395/17840 [40:27<21:13:51, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:25,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [40:31<19:48:10, 4.09s/it]g-point operations will not be computed-17 17:21:25,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [40:31<19:48:10, 4.09s/it]g-point operations will not be computed-17 17:21:25,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:30,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:29,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:30,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:29,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 397/17840 [40:34<18:16:51, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:32,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 398/17840 [40:37<16:34:41, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 398/17840 [40:37<16:34:41, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 399/17840 [40:39<15:05:01, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:37,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 399/17840 [40:39<15:05:01, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:37,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:38,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:37,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [40:43<16:27:05, 3.40s/it]g-point operations will not be computed-17 17:21:37,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [40:43<16:27:05, 3.40s/it]g-point operations will not be computed-17 17:21:37,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [40:43<16:27:05, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:42,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [40:43<16:27:05, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:42,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:46,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:42,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [40:51<23:01:24, 4.75s/it]g-point operations will not be computed-17 17:21:42,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [40:51<23:01:24, 4.75s/it]g-point operations will not be computed-17 17:21:42,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [40:51<23:01:24, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [40:51<23:01:24, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [40:51<23:01:24, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [40:51<23:01:24, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:58<27:02:04, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:58<27:02:04, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:58<27:02:04, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:03,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:03,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3752, 'learning_rate': 4.0100000000000006e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:03,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:03,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [41:13<31:37:06, 6.53s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [41:13<31:37:06, 6.53s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2762, 'learning_rate': 4.02e-05, 'epoch': 0.45} + 2%|█▋ | 404/17840 [41:13<31:37:06, 6.53s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [41:13<31:37:06, 6.53s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [41:13<31:37:06, 6.53s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [41:21<32:48:19, 6.77s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:21,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:21,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:28<33:28:03, 6.91s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:28<33:28:03, 6.91s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3022, 'learning_rate': 4.0400000000000006e-05, 'epoch': 0.46} + 2%|█▋ | 406/17840 [41:28<33:28:03, 6.91s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:28<33:28:03, 6.91s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:28<33:28:03, 6.91s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:35<33:53:11, 7.00s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:35<33:53:11, 7.00s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:35<33:53:11, 7.00s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:39,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:39,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2039, 'learning_rate': 4.0600000000000004e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:39,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:39,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [41:49<34:23:41, 7.10s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [41:49<34:23:41, 7.10s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.436, 'learning_rate': 4.07e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:52,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [41:57<34:32:17, 7.13s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [41:57<34:32:17, 7.13s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3366, 'learning_rate': 4.08e-05, 'epoch': 0.46} + 2%|█▋ | 410/17840 [41:57<34:32:17, 7.13s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [41:57<34:32:17, 7.13s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [42:04<34:24:44, 7.11s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [42:04<34:24:44, 7.11s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:04,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:04,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [42:11<34:06:16, 7.04s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [42:11<34:06:16, 7.04s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2988, 'learning_rate': 4.1e-05, 'epoch': 0.46} + 2%|█▊ | 412/17840 [42:11<34:06:16, 7.04s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [42:11<34:06:16, 7.04s/it]g-point operations will not be computed-17 17:21:50,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3554, 'learning_rate': 4.11e-05, 'epoch': 0.46} + 2%|█▊ | 413/17840 [42:18<34:01:24, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [42:18<34:01:24, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [42:18<34:01:24, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [42:18<34:01:24, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [42:25<33:55:08, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [42:25<33:55:08, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:27,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:27,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [42:31<33:37:05, 6.95s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [42:31<33:37:05, 6.95s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [42:31<33:37:05, 6.95s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:35,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:35,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4104, 'learning_rate': 4.14e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:35,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:35,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:35,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [42:45<33:20:39, 6.89s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:45,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:45,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [42:52<33:07:55, 6.85s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [42:52<33:07:55, 6.85s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3419, 'learning_rate': 4.16e-05, 'epoch': 0.47} + 2%|█▊ | 418/17840 [42:52<33:07:55, 6.85s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [42:52<33:07:55, 6.85s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [42:52<33:07:55, 6.85s/it]g-point operations will not be computed-17 17:23:16,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:59<32:54:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:59<32:54:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:59<32:54:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:59<32:54:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [43:05<32:39:32, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:05,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:05,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:05,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [43:12<32:24:21, 6.70s/it]g-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [43:12<32:24:21, 6.70s/it]g-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 422/17840 [43:18<32:17:44, 6.67s/it]g-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 422/17840 [43:18<32:17:44, 6.67s/it]g-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 422/17840 [43:18<32:17:44, 6.67s/it]g-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:22,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:22,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4073, 'learning_rate': 4.21e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:22,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:22,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:22,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [43:32<32:06:28, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [43:32<32:06:28, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [43:32<32:06:28, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [43:32<32:06:28, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [43:40<35:04:14, 7.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:40,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:40,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:40,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 426/17840 [43:47<33:55:01, 7.01s/it]g-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:47,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:47,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [43:53<33:05:55, 6.84s/it]g-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [43:53<33:05:55, 6.84s/it]g-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2875, 'learning_rate': 4.25e-05, 'epoch': 0.48} + 2%|█▊ | 427/17840 [43:53<33:05:55, 6.84s/it]g-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:56,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:56,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.454, 'learning_rate': 4.26e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:56,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:03,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:03,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2717, 'learning_rate': 4.27e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:03,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:09,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:09,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3955, 'learning_rate': 4.2800000000000004e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:09,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:09,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:09,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:30,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [44:18<31:06:21, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:17,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [44:18<31:06:21, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:17,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [44:18<31:06:21, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:17,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [44:18<31:06:21, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:17,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [44:25<30:45:15, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:23,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [44:25<30:45:15, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:23,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [44:25<30:45:15, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:23,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [44:25<30:45:15, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:23,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [44:31<30:33:24, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:29,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [44:31<30:33:24, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:29,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [44:31<30:33:24, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:29,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [44:31<30:33:24, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:29,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [44:37<30:10:41, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:35,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [44:37<30:10:41, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:35,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [44:37<30:10:41, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:35,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [44:37<30:10:41, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:35,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [44:43<29:39:35, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [44:43<29:39:35, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:45,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:45,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4822, 'learning_rate': 4.3400000000000005e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:45,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:51,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:51,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4622, 'learning_rate': 4.35e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:55,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:55,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 438/17840 [45:00<28:00:05, 5.79s/it]g-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:59,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:02,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:02,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2048, 'learning_rate': 4.3700000000000005e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:06,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 440/17840 [45:10<26:47:50, 5.54s/it]g-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 440/17840 [45:10<26:47:50, 5.54s/it]g-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:10,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:12,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:12,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4081, 'learning_rate': 4.39e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:16,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:41,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 442/17840 [45:20<24:51:06, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:18,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 442/17840 [45:20<24:51:06, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:18,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:20,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:18,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 443/17840 [45:24<23:48:34, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:22,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 443/17840 [45:24<23:48:34, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:22,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:24,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:22,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 444/17840 [45:28<22:37:56, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:26,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 444/17840 [45:28<22:37:56, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:26,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:28,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:26,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 445/17840 [45:32<21:21:01, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:30,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 445/17840 [45:32<21:21:01, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:30,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 446/17840 [45:36<19:49:59, 4.10s/it]g-point operations will not be computed-17 17:26:30,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 446/17840 [45:36<19:49:59, 4.10s/it]g-point operations will not be computed-17 17:26:30,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 446/17840 [45:36<19:49:59, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:33,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 447/17840 [45:39<18:15:20, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:36,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 447/17840 [45:39<18:15:20, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:36,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 448/17840 [45:41<16:42:22, 3.46s/it]g-point operations will not be computed-17 17:26:36,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 448/17840 [45:41<16:42:22, 3.46s/it]g-point operations will not be computed-17 17:26:36,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 449/17840 [45:44<15:04:31, 3.12s/it]g-point operations will not be computed-17 17:26:39,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 449/17840 [45:44<15:04:31, 3.12s/it]g-point operations will not be computed-17 17:26:39,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:42,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:41,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 450/17840 [45:48<16:12:13, 3.35s/it]g-point operations will not be computed-17 17:26:41,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 450/17840 [45:48<16:12:13, 3.35s/it]g-point operations will not be computed-17 17:26:41,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 450/17840 [45:48<16:12:13, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:47,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 450/17840 [45:48<16:12:13, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:47,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:50,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:47,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 451/17840 [45:55<22:41:04, 4.70s/it]g-point operations will not be computed-17 17:26:47,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 451/17840 [45:55<22:41:04, 4.70s/it]g-point operations will not be computed-17 17:26:47,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 451/17840 [45:55<22:41:04, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 451/17840 [45:55<22:41:04, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 451/17840 [45:55<22:41:04, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [46:03<26:44:40, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [46:03<26:44:40, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2825, 'learning_rate': 4.5e-05, 'epoch': 0.51} + 3%|█▉ | 452/17840 [46:03<26:44:40, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [46:03<26:44:40, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [46:10<29:29:50, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [46:10<29:29:50, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:11,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:11,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [46:18<31:15:29, 6.47s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [46:18<31:15:29, 6.47s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1538, 'learning_rate': 4.52e-05, 'epoch': 0.51} + 3%|█▉ | 454/17840 [46:18<31:15:29, 6.47s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [46:18<31:15:29, 6.47s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [46:25<32:22:06, 6.70s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [46:25<32:22:06, 6.70s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4325, 'learning_rate': 4.53e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:27,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:27,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [46:32<33:18:04, 6.90s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [46:32<33:18:04, 6.90s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [46:32<33:18:04, 6.90s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [46:32<33:18:04, 6.90s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [46:32<33:18:04, 6.90s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:40<33:46:33, 6.99s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:40<33:46:33, 6.99s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:40<33:46:33, 6.99s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2846, 'learning_rate': 4.5600000000000004e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:54<34:23:12, 7.12s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:54<34:23:12, 7.12s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:54<34:23:12, 7.12s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:58,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:58,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4657, 'learning_rate': 4.58e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:58,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:58,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:58,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [47:08<34:10:41, 7.08s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [47:08<34:10:41, 7.08s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [47:08<34:10:41, 7.08s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:12,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:12,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.267, 'learning_rate': 4.600000000000001e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:12,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:12,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:12,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [47:22<34:07:31, 7.07s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [47:22<34:07:31, 7.07s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:24,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [47:29<34:02:11, 7.05s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [47:29<34:02:11, 7.05s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2249, 'learning_rate': 4.6200000000000005e-05, 'epoch': 0.52} + 3%|█▉ | 464/17840 [47:29<34:02:11, 7.05s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [47:29<34:02:11, 7.05s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [47:29<34:02:11, 7.05s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 465/17840 [47:36<33:46:34, 7.00s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:37,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:37,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:37,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:43<33:38:38, 6.97s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:43<33:38:38, 6.97s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:43<33:38:38, 6.97s/it]g-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:47,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:47,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2756, 'learning_rate': 4.6500000000000005e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:47,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:47,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:47,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:54,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [47:57<33:16:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [47:57<33:16:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [47:57<33:16:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [47:57<33:16:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [48:03<33:09:03, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [48:03<33:09:03, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [48:03<33:09:03, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:07,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:07,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3483, 'learning_rate': 4.6800000000000006e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:07,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:07,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:07,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:55,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [48:17<32:34:15, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [48:17<32:34:15, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [48:17<32:34:15, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [48:17<32:34:15, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [48:24<32:32:22, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:24,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:24,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [48:30<32:21:39, 6.71s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [48:30<32:21:39, 6.71s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6241, 'learning_rate': 4.71e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:32,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [48:37<32:05:31, 6.65s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [48:37<32:05:31, 6.65s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.392, 'learning_rate': 4.72e-05, 'epoch': 0.53} + 3%|██ | 474/17840 [48:37<32:05:31, 6.65s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [48:37<32:05:31, 6.65s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [48:37<32:05:31, 6.65s/it]g-point operations will not be computed-17 17:29:15,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:46<35:15:55, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:46<35:15:55, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:46<35:15:55, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:46<35:15:55, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [48:52<34:09:47, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [48:52<34:09:47, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:54,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:54,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [48:58<33:08:32, 6.87s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [48:58<33:08:32, 6.87s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:00,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [49:05<32:23:26, 6.72s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [49:05<32:23:26, 6.72s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1896, 'learning_rate': 4.76e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:06,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [49:11<31:42:53, 6.58s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [49:11<31:42:53, 6.58s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.14, 'learning_rate': 4.77e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:13,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [49:17<31:13:01, 6.47s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [49:17<31:13:01, 6.47s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3633, 'learning_rate': 4.78e-05, 'epoch': 0.54} + 3%|██ | 480/17840 [49:17<31:13:01, 6.47s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [49:17<31:13:01, 6.47s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [49:17<31:13:01, 6.47s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [49:24<31:34:34, 6.55s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [49:24<31:34:34, 6.55s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:27,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [49:32<33:39:37, 6.98s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [49:32<33:39:37, 6.98s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2659, 'learning_rate': 4.8e-05, 'epoch': 0.54} + 3%|██ | 482/17840 [49:32<33:39:37, 6.98s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [49:32<33:39:37, 6.98s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [49:39<33:47:56, 7.01s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [49:39<33:47:56, 7.01s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:39,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:39,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [49:45<32:30:00, 6.74s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [49:45<32:30:00, 6.74s/it]g-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:45,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:45,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:29:44,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 485/17840 [49:51<31:07:25, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 485/17840 [49:51<31:07:25, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4805, 'learning_rate': 4.83e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:54,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:54,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2154, 'learning_rate': 4.8400000000000004e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:58,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 487/17840 [50:02<29:08:18, 6.04s/it]g-point operations will not be computed-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 487/17840 [50:02<29:08:18, 6.04s/it]g-point operations will not be computed-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1028, 'learning_rate': 4.85e-05, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:03,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 488/17840 [50:08<28:09:09, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 488/17840 [50:08<28:09:09, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2417, 'learning_rate': 4.86e-05, 'epoch': 0.55} + 3%|██ | 488/17840 [50:08<28:09:09, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:10,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:10,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:14,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:14,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:06,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 490/17840 [50:18<26:16:06, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:18,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:18,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 491/17840 [50:22<25:07:07, 5.21s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:22,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:22,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:24,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:26,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:26,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:28,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:30,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:30,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:32,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:33,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:33,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:35,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:38,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:38,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:40,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:40,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:41,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:41,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:44,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:44,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:46,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:47,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:47,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:50,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:50,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:54,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:54,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:54,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:58,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:58,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:02,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:02,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:02,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [51:08<26:42:05, 5.54s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [51:08<26:42:05, 5.54s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [51:08<26:42:05, 5.54s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [51:08<26:42:05, 5.54s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [51:08<26:42:05, 5.54s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 503/17840 [51:16<29:29:24, 6.12s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:17,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:17,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:17,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:23<31:10:31, 6.47s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:23<31:10:31, 6.47s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:23<31:10:31, 6.47s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:23<31:10:31, 6.47s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:23<31:10:31, 6.47s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [51:31<32:21:59, 6.72s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [51:31<32:21:59, 6.72s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:33,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:38<33:14:14, 6.90s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:38<33:14:14, 6.90s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3601, 'learning_rate': 5.0400000000000005e-05, 'epoch': 0.57} + 3%|██▏ | 506/17840 [51:38<33:14:14, 6.90s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:38<33:14:14, 6.90s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:38<33:14:14, 6.90s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [51:45<33:47:18, 7.02s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [51:45<33:47:18, 7.02s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [51:45<33:47:18, 7.02s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:49,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:49,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4161, 'learning_rate': 5.0600000000000003e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:49,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:49,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:49,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [52:00<34:11:06, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [52:00<34:11:06, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [52:00<34:11:06, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:04,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:04,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3779, 'learning_rate': 5.08e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:04,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:04,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:04,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [52:14<34:15:17, 7.12s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [52:14<34:15:17, 7.12s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:16,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:21<34:09:33, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:21<34:09:33, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3924, 'learning_rate': 5.1000000000000006e-05, 'epoch': 0.57} + 3%|██▏ | 512/17840 [52:21<34:09:33, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:21<34:09:33, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:21<34:09:33, 7.10s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [52:28<33:59:42, 7.06s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [52:28<33:59:42, 7.06s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:30,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [52:35<33:55:44, 7.05s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [52:35<33:55:44, 7.05s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2497, 'learning_rate': 5.1200000000000004e-05, 'epoch': 0.58} + 3%|██▏ | 514/17840 [52:35<33:55:44, 7.05s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [52:35<33:55:44, 7.05s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [52:35<33:55:44, 7.05s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [52:42<33:46:05, 7.02s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:42,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:42,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:42,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [52:49<33:33:55, 6.98s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [52:49<33:33:55, 6.98s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [52:49<33:33:55, 6.98s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:52,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:52,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4582, 'learning_rate': 5.1500000000000005e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:52,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:52,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:52,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [53:02<33:17:50, 6.92s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:03,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:03,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [53:09<33:08:24, 6.89s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [53:09<33:08:24, 6.89s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4215, 'learning_rate': 5.17e-05, 'epoch': 0.58} + 3%|██▏ | 519/17840 [53:09<33:08:24, 6.89s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [53:09<33:08:24, 6.89s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [53:09<33:08:24, 6.89s/it]g-point operations will not be computed-17 17:31:16,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [53:16<32:55:00, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [53:16<32:55:00, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [53:16<32:55:00, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [53:16<32:55:00, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [53:23<32:46:16, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:23,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:23,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [53:29<32:26:49, 6.74s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [53:29<32:26:49, 6.74s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2311, 'learning_rate': 5.2000000000000004e-05, 'epoch': 0.59} + 3%|██▏ | 522/17840 [53:29<32:26:49, 6.74s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:33,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:33,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2368, 'learning_rate': 5.2100000000000006e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:33,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:39,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:39,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3391, 'learning_rate': 5.22e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:39,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:39,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:39,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [53:51<35:15:33, 7.33s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:52,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:52,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [53:58<33:58:37, 7.06s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [53:58<33:58:37, 7.06s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:58,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:58,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [54:04<33:00:02, 6.86s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [54:04<33:00:02, 6.86s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3668, 'learning_rate': 5.25e-05, 'epoch': 0.59} + 3%|██▏ | 527/17840 [54:04<33:00:02, 6.86s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:08,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:08,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3099, 'learning_rate': 5.2600000000000005e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:08,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:14,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:14,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2852, 'learning_rate': 5.270000000000001e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:14,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:20,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:20,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5686, 'learning_rate': 5.28e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:20,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:26,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:26,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4915, 'learning_rate': 5.2900000000000005e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:26,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:32,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:32,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0933, 'learning_rate': 5.300000000000001e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:32,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3256, 'learning_rate': 5.31e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:43,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 534/17840 [54:47<29:24:28, 6.12s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 534/17840 [54:47<29:24:28, 6.12s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1984, 'learning_rate': 5.3200000000000006e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:49,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 535/17840 [54:53<28:58:46, 6.03s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 535/17840 [54:53<28:58:46, 6.03s/it]g-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:53,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:53,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:15,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [54:59<28:39:06, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:57,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [54:59<28:39:06, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:57,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3519, 'learning_rate': 5.3400000000000004e-05, 'epoch': 0.6} + 3%|██▎ | 536/17840 [54:59<28:39:06, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:57,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [54:59<28:39:06, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:57,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [55:05<28:11:48, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:03,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:06,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:03,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [55:10<27:35:37, 5.74s/it]g-point operations will not be computed-17 17:36:03,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [55:10<27:35:37, 5.74s/it]g-point operations will not be computed-17 17:36:03,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:10,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:03,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:10,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:03,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 539/17840 [55:15<26:49:57, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 539/17840 [55:15<26:49:57, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:16,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 540/17840 [55:20<25:43:42, 5.35s/it]g-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 540/17840 [55:20<25:43:42, 5.35s/it]g-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:19,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:22,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:22,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:22,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:25,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:14,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 542/17840 [55:29<23:23:41, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:27,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 542/17840 [55:29<23:23:41, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:27,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [55:33<22:08:18, 4.61s/it]g-point operations will not be computed-17 17:36:27,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [55:33<22:08:18, 4.61s/it]g-point operations will not be computed-17 17:36:27,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [55:33<22:08:18, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:31,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [55:33<22:08:18, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:31,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 544/17840 [55:37<20:44:56, 4.32s/it]g-point operations will not be computed-17 17:36:31,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 544/17840 [55:37<20:44:56, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:34,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 544/17840 [55:37<20:44:56, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:34,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 545/17840 [55:40<19:13:27, 4.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:38,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 545/17840 [55:40<19:13:27, 4.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:38,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 546/17840 [55:43<17:51:09, 3.72s/it]g-point operations will not be computed-17 17:36:38,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 546/17840 [55:43<17:51:09, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:41,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 546/17840 [55:43<17:51:09, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:41,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 547/17840 [55:46<16:27:41, 3.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:43,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 547/17840 [55:46<16:27:41, 3.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:43,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 548/17840 [55:48<15:14:19, 3.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:46,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 548/17840 [55:48<15:14:19, 3.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:46,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 549/17840 [55:51<13:57:59, 2.91s/it]g-point operations will not be computed-17 17:36:46,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:49,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:48,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:49,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:48,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [55:55<15:35:47, 3.25s/it]g-point operations will not be computed-17 17:36:48,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [55:55<15:35:47, 3.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:54,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [55:55<15:35:47, 3.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:54,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:57,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:54,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:57,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:54,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [56:02<22:08:32, 4.61s/it]g-point operations will not be computed-17 17:36:54,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [56:02<22:08:32, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [56:02<22:08:32, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:05,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:05,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [56:10<26:22:28, 5.49s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [56:10<26:22:28, 5.49s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [56:10<26:22:28, 5.49s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:14,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:14,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4411, 'learning_rate': 5.5100000000000004e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:14,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:14,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:14,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [56:25<31:02:49, 6.47s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [56:25<31:02:49, 6.47s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [56:25<31:02:49, 6.47s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [56:25<31:02:49, 6.47s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [56:25<31:02:49, 6.47s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:32<32:13:53, 6.71s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:32<32:13:53, 6.71s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:39<33:06:39, 6.90s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:39<33:06:39, 6.90s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3281, 'learning_rate': 5.5400000000000005e-05, 'epoch': 0.62} + 3%|██▎ | 556/17840 [56:39<33:06:39, 6.90s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:39<33:06:39, 6.90s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:39<33:06:39, 6.90s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:47<33:31:54, 6.98s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:47<33:31:54, 6.98s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:47<33:31:54, 6.98s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:51,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:51,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2692, 'learning_rate': 5.560000000000001e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:51,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:51,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:51,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [57:01<34:01:21, 7.09s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [57:01<34:01:21, 7.09s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [57:01<34:01:21, 7.09s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:05,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:05,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2145, 'learning_rate': 5.580000000000001e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:05,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:05,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:05,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [57:15<33:55:28, 7.07s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [57:15<33:55:28, 7.07s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:17,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [57:22<33:44:42, 7.03s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [57:22<33:44:42, 7.03s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2501, 'learning_rate': 5.6000000000000006e-05, 'epoch': 0.63} + 3%|██▍ | 562/17840 [57:22<33:44:42, 7.03s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [57:22<33:44:42, 7.03s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [57:22<33:44:42, 7.03s/it]g-point operations will not be computed-17 17:37:01,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [57:29<33:28:34, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [57:29<33:28:34, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [57:29<33:28:34, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [57:29<33:28:34, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:36<33:17:33, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:36<33:17:33, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:36<33:17:33, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:36<33:17:33, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:36<33:17:33, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:28,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [57:43<33:13:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [57:43<33:13:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [57:43<33:13:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [57:43<33:13:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [57:50<33:11:29, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:50,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:50,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [57:56<33:00:13, 6.88s/it]g-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [57:56<33:00:13, 6.88s/it]g-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2872, 'learning_rate': 5.65e-05, 'epoch': 0.64} + 3%|██▍ | 567/17840 [57:56<33:00:13, 6.88s/it]g-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [57:56<33:00:13, 6.88s/it]g-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [57:56<33:00:13, 6.88s/it]g-point operations will not be computed-17 17:38:41,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [58:03<32:56:27, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [58:03<32:56:27, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [58:03<32:56:27, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [58:03<32:56:27, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [58:10<32:49:47, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [58:10<32:49:47, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:12,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 570/17840 [58:17<32:42:52, 6.82s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 570/17840 [58:17<32:42:52, 6.82s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3159, 'learning_rate': 5.68e-05, 'epoch': 0.64} + 3%|██▍ | 570/17840 [58:17<32:42:52, 6.82s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:20,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:20,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.27, 'learning_rate': 5.69e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:20,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:20,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:20,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 572/17840 [58:30<32:11:45, 6.71s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:30,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:30,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:30,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [58:36<31:54:35, 6.65s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [58:36<31:54:35, 6.65s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:38,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [58:43<31:44:25, 6.62s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [58:43<31:44:25, 6.62s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1508, 'learning_rate': 5.72e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:45,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [58:52<34:57:55, 7.29s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [58:52<34:57:55, 7.29s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4685, 'learning_rate': 5.73e-05, 'epoch': 0.64} + 3%|██▍ | 575/17840 [58:52<34:57:55, 7.29s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:55,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:55,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2282, 'learning_rate': 5.74e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:55,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:55,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:55,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [59:05<32:54:10, 6.86s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:05,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:05,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [59:11<32:11:07, 6.71s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [59:11<32:11:07, 6.71s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:11,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:11,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [59:17<31:37:03, 6.59s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [59:17<31:37:03, 6.59s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9641, 'learning_rate': 5.77e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:19,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [59:24<31:08:34, 6.50s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [59:24<31:08:34, 6.50s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5745, 'learning_rate': 5.7799999999999995e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:25,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [59:30<30:49:04, 6.43s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [59:30<30:49:04, 6.43s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4293, 'learning_rate': 5.79e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:32,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 582/17840 [59:36<30:26:34, 6.35s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 582/17840 [59:36<30:26:34, 6.35s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:36,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:36,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [59:42<30:00:57, 6.26s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [59:42<30:00:57, 6.26s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3589, 'learning_rate': 5.8099999999999996e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:44,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [59:48<29:33:40, 6.17s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [59:48<29:33:40, 6.17s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3944, 'learning_rate': 5.82e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:49,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [59:54<29:01:11, 6.05s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [59:54<29:01:11, 6.05s/it]g-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:54,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:54,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:54,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:02,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [1:00:00<28:36:29, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [1:00:00<28:36:29, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:02,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:02,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4551, 'learning_rate': 5.85e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:02,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:08,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:08,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4496, 'learning_rate': 5.86e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:12,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 589/17840 [1:00:16<26:59:44, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:41:14,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 589/17840 [1:00:16<26:59:44, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:41:14,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2495, 'learning_rate': 5.87e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:18,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:14,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:18,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:14,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3133, 'learning_rate': 5.88e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:22,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:14,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 591/17840 [1:00:26<25:39:36, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 591/17840 [1:00:26<25:39:36, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3497, 'learning_rate': 5.89e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:28,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:28,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:30,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:32,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:32,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:35,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:37,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:37,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:39,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:40,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:40,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:42,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:44,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:44,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:47,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:47,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:48,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:48,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:51,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:53,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:53,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7379, 'learning_rate': 5.97e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:56,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:56,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3418, 'learning_rate': 5.9800000000000003e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:00,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:00,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:04,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:04,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3965, 'learning_rate': 5.99e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:04,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:11,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:11,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.317, 'learning_rate': 6e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:11,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:11,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [1:01:22<29:22:23, 6.13s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [1:01:22<29:22:23, 6.13s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3624, 'learning_rate': 6.0100000000000004e-05, 'epoch': 0.68} + 3%|██▌ | 603/17840 [1:01:22<29:22:23, 6.13s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [1:01:22<29:22:23, 6.13s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [1:01:29<31:10:59, 6.51s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [1:01:29<31:10:59, 6.51s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3104, 'learning_rate': 6.02e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:32,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [1:01:36<32:14:46, 6.74s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [1:01:36<32:14:46, 6.74s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3823, 'learning_rate': 6.03e-05, 'epoch': 0.68} + 3%|██▌ | 605/17840 [1:01:36<32:14:46, 6.74s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [1:01:36<32:14:46, 6.74s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [1:01:44<33:01:02, 6.90s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [1:01:44<33:01:02, 6.90s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.305, 'learning_rate': 6.04e-05, 'epoch': 0.68} + 3%|██▌ | 606/17840 [1:01:44<33:01:02, 6.90s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [1:01:44<33:01:02, 6.90s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [1:01:44<33:01:02, 6.90s/it]g-point operations will not be computed-17 17:41:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [1:01:51<33:29:02, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [1:01:51<33:29:02, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [1:01:51<33:29:02, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [1:01:58<33:43:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [1:01:58<33:43:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3285, 'learning_rate': 6.06e-05, 'epoch': 0.68} + 3%|██▌ | 608/17840 [1:01:58<33:43:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [1:01:58<33:43:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [1:01:58<33:43:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [1:02:05<33:55:58, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 610/17840 [1:02:12<33:48:38, 7.06s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 610/17840 [1:02:12<33:48:38, 7.06s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2968, 'learning_rate': 6.08e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:14,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [1:02:19<33:39:48, 7.03s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [1:02:19<33:39:48, 7.03s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.275, 'learning_rate': 6.09e-05, 'epoch': 0.68} + 3%|██▌ | 611/17840 [1:02:19<33:39:48, 7.03s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [1:02:19<33:39:48, 7.03s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:02:26<33:34:56, 7.02s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:02:26<33:34:56, 7.02s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.526, 'learning_rate': 6.1e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:28,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:33<33:27:18, 6.99s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:33<33:27:18, 6.99s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3724, 'learning_rate': 6.110000000000001e-05, 'epoch': 0.69} + 3%|██▌ | 613/17840 [1:02:33<33:27:18, 6.99s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:33<33:27:18, 6.99s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:33<33:27:18, 6.99s/it]g-point operations will not be computed-17 17:42:50,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [1:02:40<33:17:19, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [1:02:40<33:17:19, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [1:02:40<33:17:19, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 615/17840 [1:02:47<33:08:30, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 615/17840 [1:02:47<33:08:30, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3573, 'learning_rate': 6.13e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:02:54<32:54:36, 6.88s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:02:54<32:54:36, 6.88s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:02:54<32:54:36, 6.88s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:57,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:57,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:57,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3055, 'learning_rate': 6.15e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:57,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 618/17840 [1:03:07<32:23:12, 6.77s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 618/17840 [1:03:07<32:23:12, 6.77s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:07,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:07,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:07,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 619/17840 [1:03:14<32:18:13, 6.75s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 619/17840 [1:03:14<32:18:13, 6.75s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:16,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:16,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:03:20<32:15:34, 6.74s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:03:20<32:15:34, 6.74s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:03:20<32:15:34, 6.74s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:24,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:24,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:24,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:27,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:27,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:03:34<31:58:34, 6.69s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:03:34<31:58:34, 6.69s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2056, 'learning_rate': 6.2e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:36,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:36,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:03:40<31:48:55, 6.65s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:03:40<31:48:55, 6.65s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:03:40<31:48:55, 6.65s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:03:40<31:48:55, 6.65s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 625/17840 [1:03:56<34:59:06, 7.32s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:04:02<33:52:19, 7.08s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:02,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:02,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:02,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:04:09<32:59:39, 6.90s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:04:09<32:59:39, 6.90s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:04:09<32:59:39, 6.90s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:04:09<32:59:39, 6.90s/it]g-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:12,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:12,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:12,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:18,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:18,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3205, 'learning_rate': 6.27e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:18,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:18,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:18,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:39,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:04:28<31:20:57, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:26,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:04:28<31:20:57, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:26,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:04:28<31:20:57, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:26,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:04:28<31:20:57, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:26,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:04:34<30:57:20, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:04:34<30:57:20, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:04:34<30:57:20, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:04:34<30:57:20, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:04:40<30:28:31, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:39,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:04:40<30:28:31, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:39,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:04:40<30:28:31, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:39,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:04:40<30:28:31, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:39,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:04:46<30:08:32, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:04:46<30:08:32, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:49,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:49,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3196, 'learning_rate': 6.32e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:49,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:49,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:49,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:45,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [1:04:59<29:29:49, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [1:04:59<29:29:49, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:01,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:01,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4583, 'learning_rate': 6.340000000000001e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:01,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:07,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:07,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4623, 'learning_rate': 6.35e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:11,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:11,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 638/17840 [1:05:16<28:05:29, 5.88s/it]g-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:16,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:16,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:16,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:57,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 639/17840 [1:05:21<27:28:01, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 639/17840 [1:05:21<27:28:01, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:23,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:23,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:26,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:26,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:26,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:20,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 641/17840 [1:05:32<25:57:09, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:32,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 642/17840 [1:05:36<24:58:26, 5.23s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 642/17840 [1:05:36<24:58:26, 5.23s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:35,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:38,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:38,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:40,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:42,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:42,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:44,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:45,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:45,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:47,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:47,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:50,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:52,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:52,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:54,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:54,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:56,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:56,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:58,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:58,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:01,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:01,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3744, 'learning_rate': 6.48e-05, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:09,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:09,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5348, 'learning_rate': 6.49e-05, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:09,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:09,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:09,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 652/17840 [1:06:20<27:01:14, 5.66s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:21,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:21,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:28<29:34:37, 6.20s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:28<29:34:37, 6.20s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4836, 'learning_rate': 6.510000000000001e-05, 'epoch': 0.73} + 4%|██▋ | 653/17840 [1:06:28<29:34:37, 6.20s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:28<29:34:37, 6.20s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:06:35<31:20:25, 6.56s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:06:35<31:20:25, 6.56s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5313, 'learning_rate': 6.52e-05, 'epoch': 0.73} + 4%|██▋ | 654/17840 [1:06:35<31:20:25, 6.56s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:39,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:39,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4241, 'learning_rate': 6.53e-05, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:39,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:39,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:06:50<33:04:48, 6.93s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:06:50<33:04:48, 6.93s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3432, 'learning_rate': 6.54e-05, 'epoch': 0.74} + 4%|██▋ | 656/17840 [1:06:50<33:04:48, 6.93s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:54,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:54,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.378, 'learning_rate': 6.55e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:54,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:54,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:54,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:07:04<33:51:25, 7.09s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:07:04<33:51:25, 7.09s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:07:04<33:51:25, 7.09s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:07:04<33:51:25, 7.09s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:07:04<33:51:25, 7.09s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:07:11<34:04:49, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:07:11<34:04:49, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:14,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:14,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:07:18<34:04:01, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:07:18<34:04:01, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:07:18<34:04:01, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:07:18<34:04:01, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:07:18<34:04:01, 7.14s/it]g-point operations will not be computed-17 17:46:30,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:07:25<33:54:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:07:25<33:54:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:07:25<33:54:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:07:25<33:54:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:32<33:48:22, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:32<33:48:22, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:32<33:48:22, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:32<33:48:22, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:32<33:48:22, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 663/17840 [1:07:39<33:37:32, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:40,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:40,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:40,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 664/17840 [1:07:46<33:23:42, 7.00s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 664/17840 [1:07:46<33:23:42, 7.00s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:48,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:07:53<33:10:41, 6.95s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:07:53<33:10:41, 6.95s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2954, 'learning_rate': 6.630000000000001e-05, 'epoch': 0.75} + 4%|██▊ | 665/17840 [1:07:53<33:10:41, 6.95s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:07:53<33:10:41, 6.95s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:07:53<33:10:41, 6.95s/it]g-point operations will not be computed-17 17:48:24,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:08:00<32:56:08, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:08:00<32:56:08, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:08:00<32:56:08, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:08:00<32:56:08, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 667/17840 [1:08:07<32:53:33, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 667/17840 [1:08:07<32:53:33, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:09,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:08:14<32:42:11, 6.86s/it]g-point operations will not be computed-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:08:14<32:42:11, 6.86s/it]g-point operations will not be computed-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4404, 'learning_rate': 6.66e-05, 'epoch': 0.75} + 4%|██▊ | 668/17840 [1:08:14<32:42:11, 6.86s/it]g-point operations will not be computed-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:08:14<32:42:11, 6.86s/it]g-point operations will not be computed-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:08:14<32:42:11, 6.86s/it]g-point operations will not be computed-17 17:48:59,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:08:20<32:32:53, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:08:20<32:32:53, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:08:20<32:32:53, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:08:20<32:32:53, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:08:27<32:21:54, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:27,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:27,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:08:34<32:13:03, 6.76s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:08:34<32:13:03, 6.76s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2566, 'learning_rate': 6.690000000000001e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:36,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 672/17840 [1:08:40<31:54:17, 6.69s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 672/17840 [1:08:40<31:54:17, 6.69s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3261, 'learning_rate': 6.7e-05, 'epoch': 0.75} + 4%|██▊ | 672/17840 [1:08:40<31:54:17, 6.69s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.197, 'learning_rate': 6.71e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:08:53<31:35:12, 6.62s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:54,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:54,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:09:02<34:31:19, 7.24s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:09:02<34:31:19, 7.24s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1982, 'learning_rate': 6.730000000000001e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:04,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 676/17840 [1:09:09<33:28:03, 7.02s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 676/17840 [1:09:09<33:28:03, 7.02s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5111, 'learning_rate': 6.740000000000001e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:10,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 677/17840 [1:09:15<32:37:48, 6.84s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 677/17840 [1:09:15<32:37:48, 6.84s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1875, 'learning_rate': 6.750000000000001e-05, 'epoch': 0.76} + 4%|██▊ | 677/17840 [1:09:15<32:37:48, 6.84s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:18,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:18,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0942, 'learning_rate': 6.76e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:18,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:25,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:25,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2466, 'learning_rate': 6.77e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:25,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:31,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:31,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3476, 'learning_rate': 6.780000000000001e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:31,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:31,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:31,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:09:40<30:24:10, 6.38s/it]g-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:40,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:40,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:40,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:46<30:05:43, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:45,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:46<30:05:43, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:45,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:46<30:05:43, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:45,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:46<30:05:43, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:45,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:09:52<29:51:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:51,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:09:52<29:51:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:51,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:09:52<29:51:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:51,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:09:52<29:51:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:51,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 684/17840 [1:09:58<29:33:14, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 684/17840 [1:09:58<29:33:14, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:01,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:01,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4912, 'learning_rate': 6.83e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:01,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:07,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:07,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3143, 'learning_rate': 6.840000000000001e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:11,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:10:16<28:07:11, 5.90s/it]g-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:10:16<28:07:11, 5.90s/it]g-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:16,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:16,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 688/17840 [1:10:21<27:51:10, 5.85s/it]g-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 688/17840 [1:10:21<27:51:10, 5.85s/it]g-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:21,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:24,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:24,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5293, 'learning_rate': 6.87e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:28,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 690/17840 [1:10:32<26:28:47, 5.56s/it]g-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 690/17840 [1:10:32<26:28:47, 5.56s/it]g-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:32,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:32,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:32,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:57,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:10:37<25:46:26, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:35,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:38,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:35,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 692/17840 [1:10:42<24:47:29, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:40,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 692/17840 [1:10:42<24:47:29, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:40,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:42,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:40,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 693/17840 [1:10:46<23:30:32, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:44,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 693/17840 [1:10:46<23:30:32, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:44,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:46,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:44,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 694/17840 [1:10:50<22:05:07, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:48,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 694/17840 [1:10:50<22:05:07, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:48,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:50,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:48,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:10:54<20:36:37, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:52,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:10:54<20:36:37, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:52,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 696/17840 [1:10:57<19:05:24, 4.01s/it]g-point operations will not be computed-17 17:51:52,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 696/17840 [1:10:57<19:05:24, 4.01s/it]g-point operations will not be computed-17 17:51:52,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:56,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:55,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 697/17840 [1:11:00<17:43:45, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:58,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 697/17840 [1:11:00<17:43:45, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:58,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 698/17840 [1:11:03<16:09:46, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:00,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 698/17840 [1:11:03<16:09:46, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:00,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.43, 'learning_rate': 6.96e-05, 'epoch': 0.78} + 4%|██▉ | 699/17840 [1:11:05<14:40:39, 3.08s/it]g-point operations will not be computed-17 17:52:00,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:04,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:03,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:11:09<16:03:13, 3.37s/it]g-point operations will not be computed-17 17:52:03,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:11:09<16:03:13, 3.37s/it]g-point operations will not be computed-17 17:52:03,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:11:09<16:03:13, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:08,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:11:09<16:03:13, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:08,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:12,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:08,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:12,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:08,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:11:17<22:24:25, 4.71s/it]g-point operations will not be computed-17 17:52:08,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:11:17<22:24:25, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:11:17<22:24:25, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:11:17<22:24:25, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:11:17<22:24:25, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:11:24<26:23:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:11:24<26:23:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:11:24<26:23:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:29,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:29,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2046, 'learning_rate': 7.01e-05, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:29,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:29,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:29,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:39<30:36:17, 6.43s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:39<30:36:17, 6.43s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:39<30:36:17, 6.43s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:39<30:36:17, 6.43s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:39<30:36:17, 6.43s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:11:46<31:49:18, 6.69s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:47,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:47,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:47,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:53<32:32:49, 6.84s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:53<32:32:49, 6.84s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:53<32:32:49, 6.84s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:53<32:32:49, 6.84s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:53<32:32:49, 6.84s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:12:01<33:09:37, 6.97s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:01,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:01,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:12:08<33:26:52, 7.03s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:12:08<33:26:52, 7.03s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5083, 'learning_rate': 7.06e-05, 'epoch': 0.79} + 4%|██▉ | 708/17840 [1:12:08<33:26:52, 7.03s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:12:08<33:26:52, 7.03s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:12:08<33:26:52, 7.03s/it]g-point operations will not be computed-17 17:52:16,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:12:15<33:36:32, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:12:15<33:36:32, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:12:15<33:36:32, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 710/17840 [1:12:22<33:39:19, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 710/17840 [1:12:22<33:39:19, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5161, 'learning_rate': 7.08e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:24,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:24,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:14,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:29<33:23:58, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:29<33:23:58, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:29<33:23:58, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:29<33:23:58, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:12:36<33:22:46, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:12:36<33:22:46, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:38,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:12:43<33:22:17, 7.01s/it]g-point operations will not be computed-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:12:43<33:22:17, 7.01s/it]g-point operations will not be computed-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2991, 'learning_rate': 7.11e-05, 'epoch': 0.8} + 4%|██▉ | 713/17840 [1:12:43<33:22:17, 7.01s/it]g-point operations will not be computed-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:12:43<33:22:17, 7.01s/it]g-point operations will not be computed-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:12:43<33:22:17, 7.01s/it]g-point operations will not be computed-17 17:53:28,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:12:50<33:19:24, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:12:50<33:19:24, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:12:50<33:19:24, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:12:57<33:06:58, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:12:57<33:06:58, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5305, 'learning_rate': 7.13e-05, 'epoch': 0.8} + 4%|██▉ | 715/17840 [1:12:57<33:06:58, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:01,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:01,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3216, 'learning_rate': 7.14e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:01,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:01,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:13:11<32:48:31, 6.90s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:13:11<32:48:31, 6.90s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:11,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:11,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:13:17<32:39:42, 6.87s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:13:17<32:39:42, 6.87s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2857, 'learning_rate': 7.16e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:19,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:13:24<32:17:55, 6.79s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:13:24<32:17:55, 6.79s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2233, 'learning_rate': 7.17e-05, 'epoch': 0.81} + 4%|██▉ | 719/17840 [1:13:24<32:17:55, 6.79s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:28,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:28,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4634, 'learning_rate': 7.18e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:28,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:28,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:13:37<32:03:25, 6.74s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:13:37<32:03:25, 6.74s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.177, 'learning_rate': 7.19e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:39,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:13:44<31:49:32, 6.69s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:13:44<31:49:32, 6.69s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2175, 'learning_rate': 7.2e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:46,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:13:50<31:39:49, 6.66s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:13:50<31:39:49, 6.66s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3338, 'learning_rate': 7.21e-05, 'epoch': 0.81} + 4%|██▉ | 723/17840 [1:13:50<31:39:49, 6.66s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:13:50<31:39:49, 6.66s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:13:50<31:39:49, 6.66s/it]g-point operations will not be computed-17 17:53:49,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:13:57<31:30:15, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:13:57<31:30:15, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:13:57<31:30:15, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:14:06<34:37:54, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:14:06<34:37:54, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3544, 'learning_rate': 7.23e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:08,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:14:13<33:46:34, 7.10s/it]g-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:14:13<33:46:34, 7.10s/it]g-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6157, 'learning_rate': 7.24e-05, 'epoch': 0.81} + 4%|███ | 726/17840 [1:14:13<33:46:34, 7.10s/it]g-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:16,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:16,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.446, 'learning_rate': 7.25e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:16,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:16,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:22,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:22,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:22,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:22,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:28,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:28,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:28,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:28,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:35,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:35,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:35,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:41,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:41,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6889, 'learning_rate': 7.29e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:41,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:41,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:41,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:56,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:14:50<29:56:54, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:49,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:14:50<29:56:54, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:49,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:14:50<29:56:54, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:49,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:14:50<29:56:54, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:49,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:14:56<29:37:56, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:14:56<29:37:56, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:14:56<29:37:56, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:59,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:59,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:03,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:03,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:15:08<28:28:24, 5.99s/it]g-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:15:08<28:28:24, 5.99s/it]g-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:09,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:09,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 736/17840 [1:15:13<28:01:55, 5.90s/it]g-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:13,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:13,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:13,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:55,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 737/17840 [1:15:19<27:30:12, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 737/17840 [1:15:19<27:30:12, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 737/17840 [1:15:19<27:30:12, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:21,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:21,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:25,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:25,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 739/17840 [1:15:29<26:10:03, 5.51s/it]g-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:29,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:31,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:31,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6041, 'learning_rate': 7.38e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:35,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:35,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:17,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 741/17840 [1:15:39<24:35:03, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:40,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:40,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 742/17840 [1:15:44<23:54:20, 5.03s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:43,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:43,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:45,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:47,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:47,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:49,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:51,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:51,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:53,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:55,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:55,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:58,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:58,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:01,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:01,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:04,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:04,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:05,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:06,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:06,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:09,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:09,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:17,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:17,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:17,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:17,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:17,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:27<26:32:10, 5.59s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:27<26:32:10, 5.59s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:30,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:16:35<29:14:21, 6.16s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:16:35<29:14:21, 6.16s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4927, 'learning_rate': 7.510000000000001e-05, 'epoch': 0.84} + 4%|███ | 753/17840 [1:16:35<29:14:21, 6.16s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:16:35<29:14:21, 6.16s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:16:35<29:14:21, 6.16s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:42<30:56:19, 6.52s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:42<30:56:19, 6.52s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:42<30:56:19, 6.52s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:46,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:46,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.472, 'learning_rate': 7.53e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:52,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 756/17840 [1:16:57<32:52:42, 6.93s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 756/17840 [1:16:57<32:52:42, 6.93s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4566, 'learning_rate': 7.54e-05, 'epoch': 0.85} + 4%|███▏ | 756/17840 [1:16:57<32:52:42, 6.93s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 756/17840 [1:16:57<32:52:42, 6.93s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 756/17840 [1:16:57<32:52:42, 6.93s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:17:04<33:12:36, 7.00s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:17:04<33:12:36, 7.00s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:17:04<33:12:36, 7.00s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:08,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:08,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4564, 'learning_rate': 7.560000000000001e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:08,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:08,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:08,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:17:18<33:34:02, 7.07s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:17:18<33:34:02, 7.07s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:21,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 760/17840 [1:17:26<33:40:23, 7.10s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 760/17840 [1:17:26<33:40:23, 7.10s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3836, 'learning_rate': 7.58e-05, 'epoch': 0.85} + 4%|███▏ | 760/17840 [1:17:26<33:40:23, 7.10s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 760/17840 [1:17:26<33:40:23, 7.10s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 760/17840 [1:17:26<33:40:23, 7.10s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 761/17840 [1:17:32<33:29:38, 7.06s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:33,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:33,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:17:40<33:25:23, 7.05s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:17:40<33:25:23, 7.05s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4167, 'learning_rate': 7.6e-05, 'epoch': 0.85} + 4%|███▏ | 762/17840 [1:17:40<33:25:23, 7.05s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:43,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:43,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3325, 'learning_rate': 7.61e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:43,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:43,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:43,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:53<33:12:08, 7.00s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:53<33:12:08, 7.00s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:53<33:12:08, 7.00s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:57,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:57,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5169, 'learning_rate': 7.630000000000001e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:57,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:57,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:57,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:18:07<32:57:52, 6.95s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:08,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:08,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:18:14<32:47:56, 6.92s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:18:14<32:47:56, 6.92s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.277, 'learning_rate': 7.65e-05, 'epoch': 0.86} + 4%|███▏ | 767/17840 [1:18:14<32:47:56, 6.92s/it]g-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:18,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:18,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3775, 'learning_rate': 7.66e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:18,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:18,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:18,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:18:28<32:31:32, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:18:28<32:31:32, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:18:28<32:31:32, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 770/17840 [1:18:34<32:25:24, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 770/17840 [1:18:34<32:25:24, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3647, 'learning_rate': 7.680000000000001e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:36,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:18:41<32:18:04, 6.81s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:18:41<32:18:04, 6.81s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2901, 'learning_rate': 7.69e-05, 'epoch': 0.86} + 4%|███▏ | 771/17840 [1:18:41<32:18:04, 6.81s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:45,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:45,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4022, 'learning_rate': 7.7e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:48,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:48,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:18:55<32:08:01, 6.78s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:18:55<32:08:01, 6.78s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6164, 'learning_rate': 7.71e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:57,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:19:01<32:03:09, 6.76s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:19:01<32:03:09, 6.76s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1116, 'learning_rate': 7.72e-05, 'epoch': 0.87} + 4%|███▏ | 774/17840 [1:19:01<32:03:09, 6.76s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:19:01<32:03:09, 6.76s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:19:01<32:03:09, 6.76s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:19:11<35:14:10, 7.43s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:11,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:11,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 776/17840 [1:19:17<33:58:42, 7.17s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 776/17840 [1:19:17<33:58:42, 7.17s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:17,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:17,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:19:23<32:59:19, 6.96s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:19:23<32:59:19, 6.96s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1241, 'learning_rate': 7.75e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:25,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:19:30<32:13:37, 6.80s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:19:30<32:13:37, 6.80s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4284, 'learning_rate': 7.76e-05, 'epoch': 0.87} + 4%|███▏ | 778/17840 [1:19:30<32:13:37, 6.80s/it]g-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:33,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:33,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3613, 'learning_rate': 7.77e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:33,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:40,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:40,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.339, 'learning_rate': 7.780000000000001e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:40,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:40,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:40,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:26,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:19:49<30:42:00, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:47,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:19:49<30:42:00, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:47,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:19:49<30:42:00, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:47,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:19:49<30:42:00, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:47,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:55<30:17:44, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:54,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:55<30:17:44, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:54,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:55<30:17:44, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:54,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:55<30:17:44, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:54,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:20:01<29:52:33, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:20:01<29:52:33, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:04,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:04,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2081, 'learning_rate': 7.82e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:04,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:04,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:10,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:10,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:14,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:14,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 786/17840 [1:20:19<28:30:04, 6.02s/it]g-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:19,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:19,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:19,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 787/17840 [1:20:24<27:55:26, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 787/17840 [1:20:24<27:55:26, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:27,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:27,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4428, 'learning_rate': 7.860000000000001e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:31,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:31,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 789/17840 [1:20:35<26:42:45, 5.64s/it]g-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:35,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:35,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:35,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:23,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 790/17840 [1:20:40<26:01:38, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:41,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:41,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 791/17840 [1:20:46<25:28:20, 5.38s/it]g-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:45,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:47,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:47,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2547, 'learning_rate': 7.900000000000001e-05, 'epoch': 0.89} +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:51,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:51,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:39,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:20:55<23:41:55, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:20:55<23:41:55, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:20:55<23:41:55, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:56,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:58,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:58,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:00,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:03,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:03,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:05,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:05,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:06,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:06,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:09,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:10,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:10,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:13,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:13,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:15,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:15,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:20,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:20,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:20,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:28,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:31,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:31,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3059, 'learning_rate': 8e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:31,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:31,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:31,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:42<29:33:08, 6.24s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:42<29:33:08, 6.24s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:42<29:33:08, 6.24s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:42<29:33:08, 6.24s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:42<29:33:08, 6.24s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:21:49<31:04:58, 6.57s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:21:49<31:04:58, 6.57s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:52,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:52,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:57<32:13:00, 6.81s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:57<32:13:00, 6.81s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:57<32:13:00, 6.81s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:57<32:13:00, 6.81s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:57<32:13:00, 6.81s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:22:04<32:57:02, 6.96s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:22:04<32:57:02, 6.96s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:22:04<32:57:02, 6.96s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:22:04<32:57:02, 6.96s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:22:04<32:57:02, 6.96s/it]g-point operations will not be computed-17 18:01:53,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:22:11<33:21:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:22:11<33:21:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:22:11<33:21:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:22:11<33:21:49, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:22:18<33:33:31, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:22:18<33:33:31, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:22:18<33:33:31, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:22,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:22,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6393, 'learning_rate': 8.070000000000001e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:22,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:22,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:22,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:22:33<33:31:24, 7.09s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:22:33<33:31:24, 7.09s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:22:33<33:31:24, 7.09s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:37,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:37,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6519, 'learning_rate': 8.090000000000001e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:37,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:37,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:37,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:22:47<33:19:20, 7.04s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:22:47<33:19:20, 7.04s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:49,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:22:54<33:12:59, 7.02s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:22:54<33:12:59, 7.02s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2308, 'learning_rate': 8.11e-05, 'epoch': 0.91} + 5%|███▎ | 813/17840 [1:22:54<33:12:59, 7.02s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:22:54<33:12:59, 7.02s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:22:54<33:12:59, 7.02s/it]g-point operations will not be computed-17 18:03:10,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:23:01<33:01:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:23:01<33:01:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:23:01<33:01:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:23:01<33:01:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:23:07<32:59:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:23:07<32:59:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:23:07<32:59:09, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:11,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:11,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3746, 'learning_rate': 8.14e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:11,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:11,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:11,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:03:59,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:23:21<32:41:40, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:23:21<32:41:40, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:23:21<32:41:40, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:23:28<32:26:01, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:23:28<32:26:01, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3887, 'learning_rate': 8.16e-05, 'epoch': 0.92} + 5%|███▍ | 818/17840 [1:23:28<32:26:01, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4195, 'learning_rate': 8.17e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:32,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:23:42<32:16:26, 6.83s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:23:48<32:03:25, 6.78s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:23:48<32:03:25, 6.78s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5771, 'learning_rate': 8.19e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:50,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:23:55<31:52:22, 6.74s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:23:55<31:52:22, 6.74s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3105, 'learning_rate': 8.2e-05, 'epoch': 0.92} + 5%|███▍ | 822/17840 [1:23:55<31:52:22, 6.74s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:23:55<31:52:22, 6.74s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:23:55<31:52:22, 6.74s/it]g-point operations will not be computed-17 18:04:20,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:24:01<31:38:45, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:24:01<31:38:45, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:24:01<31:38:45, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:24:01<31:38:45, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:24:08<31:28:40, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:08,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:08,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:24:17<34:38:42, 7.33s/it]g-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:24:17<34:38:42, 7.33s/it]g-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5652, 'learning_rate': 8.23e-05, 'epoch': 0.92} + 5%|███�� | 825/17840 [1:24:17<34:38:42, 7.33s/it]g-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:20,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:20,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3825, 'learning_rate': 8.24e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:20,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:27,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:27,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3019, 'learning_rate': 8.25e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:27,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:33,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:33,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1977, 'learning_rate': 8.26e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:33,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:33,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:33,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:00,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:24:42<31:10:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:24:42<31:10:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:24:42<31:10:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:24:42<31:10:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:24:49<30:34:28, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:49,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:49,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:49,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:05:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:24:55<30:11:26, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:53,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:24:55<30:11:26, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:53,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:24:55<30:11:26, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:53,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:24:55<30:11:26, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:53,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:25:01<29:46:18, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:59,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:25:01<29:46:18, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:59,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:25:01<29:46:18, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:59,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:25:01<29:46:18, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:05:59,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:25:07<29:26:53, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:06,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:25:07<29:26:53, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:06,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:25:07<29:26:53, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:06,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:25:07<29:26:53, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:06,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:25:13<28:59:19, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:25:13<28:59:19, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:16,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:16,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3565, 'learning_rate': 8.33e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:20,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 836/17840 [1:25:24<28:01:26, 5.93s/it]g-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 836/17840 [1:25:24<28:01:26, 5.93s/it]g-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4969, 'learning_rate': 8.34e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:26,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:25:30<27:25:05, 5.81s/it]g-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:25:30<27:25:05, 5.81s/it]g-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:30,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:30,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:32,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:32,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:36,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:36,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 839/17840 [1:25:40<26:05:14, 5.52s/it]g-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:40,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:40,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:42,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:42,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:46,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:46,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:11,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 841/17840 [1:25:50<24:13:08, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:48,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:50,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:48,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:50,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:48,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 842/17840 [1:25:55<23:20:31, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:53,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:54,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:53,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:54,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:53,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 843/17840 [1:25:59<22:01:12, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:57,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:58,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:57,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:58,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:57,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:26:02<20:47:26, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:00,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 845/17840 [1:26:06<19:17:26, 4.09s/it]g-point operations will not be computed-17 18:07:00,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 845/17840 [1:26:06<19:17:26, 4.09s/it]g-point operations will not be computed-17 18:07:00,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:05,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:03,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:05,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:03,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 846/17840 [1:26:09<17:46:05, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:06,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 846/17840 [1:26:09<17:46:05, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:06,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 847/17840 [1:26:11<16:21:28, 3.47s/it]g-point operations will not be computed-17 18:07:06,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 848/17840 [1:26:14<15:01:56, 3.18s/it]g-point operations will not be computed-17 18:07:09,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 848/17840 [1:26:14<15:01:56, 3.18s/it]g-point operations will not be computed-17 18:07:09,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:13,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:12,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:13,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:12,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:15,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:14,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:15,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:14,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:26:21<15:29:59, 3.28s/it]g-point operations will not be computed-17 18:07:14,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:26:21<15:29:59, 3.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:20,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:26:21<15:29:59, 3.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:20,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:23,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:20,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:23,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:20,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:26:28<22:02:14, 4.67s/it]g-point operations will not be computed-17 18:07:20,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:26:28<22:02:14, 4.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:27,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:31,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:27,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:26:36<26:18:32, 5.58s/it]g-point operations will not be computed-17 18:07:27,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:26:36<26:18:32, 5.58s/it]g-point operations will not be computed-17 18:07:27,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:26:36<26:18:32, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:26:36<26:18:32, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:26:36<26:18:32, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:26:36<26:18:32, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:44<29:05:22, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:44<29:05:22, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:44<29:05:22, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:44<29:05:22, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:44<29:05:22, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 854/17840 [1:26:51<30:51:47, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:52,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:52,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:58<32:00:05, 6.78s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:58<32:00:05, 6.78s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3507, 'learning_rate': 8.53e-05, 'epoch': 0.96} + 5%|███▌ | 855/17840 [1:26:58<32:00:05, 6.78s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:58<32:00:05, 6.78s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:58<32:00:05, 6.78s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:27:06<32:36:43, 6.91s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:27:06<32:36:43, 6.91s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:27:06<32:36:43, 6.91s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:10,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:10,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.508, 'learning_rate': 8.55e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:10,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:10,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:10,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:27:20<33:21:30, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:27:20<33:21:30, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:22,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:27<33:21:11, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:27<33:21:11, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1824, 'learning_rate': 8.57e-05, 'epoch': 0.96} + 5%|███▌ | 859/17840 [1:27:27<33:21:11, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:27<33:21:11, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:27<33:21:11, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:27:34<33:19:43, 7.07s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:35,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:35,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:41<33:11:35, 7.04s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:41<33:11:35, 7.04s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5717, 'learning_rate': 8.59e-05, 'epoch': 0.97} + 5%|███▌ | 861/17840 [1:27:41<33:11:35, 7.04s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:41<33:11:35, 7.04s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:41<33:11:35, 7.04s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 862/17840 [1:27:48<33:00:29, 7.00s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:48,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:48,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:27:55<32:58:46, 6.99s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:27:55<32:58:46, 6.99s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4994, 'learning_rate': 8.61e-05, 'epoch': 0.97} + 5%|███▌ | 863/17840 [1:27:55<32:58:46, 6.99s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7893, 'learning_rate': 8.620000000000001e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 865/17840 [1:28:09<32:28:32, 6.89s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:09,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:09,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:28:15<32:21:35, 6.86s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:28:15<32:21:35, 6.86s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3603, 'learning_rate': 8.64e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:17,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:28:22<32:08:16, 6.82s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:28:22<32:08:16, 6.82s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4277, 'learning_rate': 8.65e-05, 'epoch': 0.97} + 5%|███▌ | 867/17840 [1:28:22<32:08:16, 6.82s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:28:22<32:08:16, 6.82s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:28:22<32:08:16, 6.82s/it]g-point operations will not be computed-17 18:07:35,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:29<32:01:16, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:29<32:01:16, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:29<32:01:16, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:28:36<31:56:06, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:28:36<31:56:06, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:36,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:36,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:28:42<31:42:43, 6.73s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:28:42<31:42:43, 6.73s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7087, 'learning_rate': 8.680000000000001e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:44,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:28:49<31:27:08, 6.67s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:28:49<31:27:08, 6.67s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.36, 'learning_rate': 8.69e-05, 'epoch': 0.98} + 5%|███▌ | 871/17840 [1:28:49<31:27:08, 6.67s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:52,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:52,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4872, 'learning_rate': 8.7e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:52,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:52,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:29:02<31:05:58, 6.60s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:29:02<31:05:58, 6.60s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:02,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:02,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:29:08<30:46:54, 6.53s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:29:08<30:46:54, 6.53s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:08,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:08,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:29:17<33:53:57, 7.19s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:29:17<33:53:57, 7.19s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.73, 'learning_rate': 8.730000000000001e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:19,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:29:23<32:44:49, 6.95s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:29:23<32:44:49, 6.95s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3078, 'learning_rate': 8.740000000000001e-05, 'epoch': 0.98} + 5%|███▋ | 876/17840 [1:29:23<32:44:49, 6.95s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:29:23<32:44:49, 6.95s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:26,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:26,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:31,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:31,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:29:36<30:49:59, 6.54s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:29:36<30:49:59, 6.54s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:37,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:37,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 879/17840 [1:29:42<29:52:07, 6.34s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:41,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:41,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:41,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:29:47<29:05:21, 6.17s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:47,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:47,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:47,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 881/17840 [1:29:53<28:21:26, 6.02s/it]g-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:28,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:29:59<27:43:42, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:29:59<27:43:42, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:29:59<27:43:42, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:01,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:03,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:03,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:03,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:57,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 884/17840 [1:30:09<25:47:52, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:07,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:09,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:07,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:09,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:07,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 885/17840 [1:30:13<24:31:42, 5.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:11,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:11,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:11,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 886/17840 [1:30:18<23:11:32, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:16,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:18,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:16,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:18,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:16,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 887/17840 [1:30:22<21:57:02, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:20,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:21,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:20,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:21,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:20,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 888/17840 [1:30:25<20:21:30, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:23,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 889/17840 [1:30:28<18:46:04, 3.99s/it]g-point operations will not be computed-17 18:11:23,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 889/17840 [1:30:28<18:46:04, 3.99s/it]g-point operations will not be computed-17 18:11:23,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:27,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:27,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 890/17840 [1:30:31<17:08:36, 3.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:29,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 890/17840 [1:30:31<17:08:36, 3.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:29,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 891/17840 [1:30:34<15:23:29, 3.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:31,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 891/17840 [1:30:34<15:23:29, 3.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:31,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:36<13:46:58, 2.93s/it]g-point operations will not be computed-17 18:11:31,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:36<13:46:58, 2.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:35,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:36<13:46:58, 2.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:35,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:39,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:35,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:39,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:35,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:44<21:05:59, 4.48s/it]g-point operations will not be computed-17 18:11:35,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:44<21:05:59, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:44<21:05:59, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:44<21:05:59, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:44<21:05:59, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:52<25:40:51, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:52<25:40:51, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:52<25:40:51, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:52<25:40:51, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:52<25:40:51, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:43,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:30:59<28:29:54, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:30:59<28:29:54, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:30:59<28:29:54, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:30:59<28:29:54, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:31:06<30:27:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:31:06<30:27:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:31:06<30:27:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:31:06<30:27:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:31:06<30:27:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:31:14<31:47:41, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:31:14<31:47:41, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:31:14<31:47:41, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:18,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:18,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3585, 'learning_rate': 8.960000000000001e-05, 'epoch': 1.01} +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:18,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:18,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:18,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:29<33:09:24, 7.05s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:29<33:09:24, 7.05s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:29<33:09:24, 7.05s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:29<33:09:24, 7.05s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:29<33:09:24, 7.05s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:31:38<36:48:50, 7.82s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:31:38<36:48:50, 7.82s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:41,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:31:45<36:03:46, 7.66s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:31:45<36:03:46, 7.66s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1974, 'learning_rate': 8.99e-05, 'epoch': 1.01} + 5%|███▋ | 901/17840 [1:31:45<36:03:46, 7.66s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:31:45<36:03:46, 7.66s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:31:45<36:03:46, 7.66s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:31:53<35:25:37, 7.53s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:31:53<35:25:37, 7.53s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:55,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:32:00<34:44:26, 7.38s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:32:00<34:44:26, 7.38s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9527, 'learning_rate': 9.010000000000001e-05, 'epoch': 1.01} + 5%|███▋ | 903/17840 [1:32:00<34:44:26, 7.38s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:32:00<34:44:26, 7.38s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:32:00<34:44:26, 7.38s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 904/17840 [1:32:07<34:15:21, 7.28s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:07,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:07,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:32:14<33:46:07, 7.18s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:32:14<33:46:07, 7.18s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1762, 'learning_rate': 9.030000000000001e-05, 'epoch': 1.01} + 5%|███▊ | 905/17840 [1:32:14<33:46:07, 7.18s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:32:14<33:46:07, 7.18s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:32:14<33:46:07, 7.18s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:32:21<33:27:38, 7.11s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:21,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:21,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:32:28<33:03:17, 7.03s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:32:28<33:03:17, 7.03s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3478, 'learning_rate': 9.05e-05, 'epoch': 1.02} + 5%|███▊ | 907/17840 [1:32:28<33:03:17, 7.03s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:31,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:31,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3365, 'learning_rate': 9.06e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:31,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:31,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:31,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:32:41<32:29:21, 6.91s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:41,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:41,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:32:48<32:15:33, 6.86s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:32:48<32:15:33, 6.86s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1506, 'learning_rate': 9.080000000000001e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:50,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:32:55<32:07:44, 6.83s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:32:55<32:07:44, 6.83s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0467, 'learning_rate': 9.090000000000001e-05, 'epoch': 1.02} + 5%|███▊ | 911/17840 [1:32:55<32:07:44, 6.83s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:32:55<32:07:44, 6.83s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:32:55<32:07:44, 6.83s/it]g-point operations will not be computed-17 18:11:58,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:33:01<31:58:34, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:33:01<31:58:34, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:33:01<31:58:34, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:33:01<31:58:34, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 913/17840 [1:33:08<31:50:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:08,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:08,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:33:15<31:37:50, 6.73s/it]g-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:33:15<31:37:50, 6.73s/it]g-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3801, 'learning_rate': 9.120000000000001e-05, 'epoch': 1.02} + 5%|███▊ | 914/17840 [1:33:15<31:37:50, 6.73s/it]g-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8849, 'learning_rate': 9.130000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:33:28<31:14:57, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:33:28<31:14:57, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:33:28<31:14:57, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:33:28<31:14:57, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:33:34<31:02:56, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:34,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:34,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:33:41<30:39:36, 6.52s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:33:41<30:39:36, 6.52s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:41,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:41,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:33:47<30:25:25, 6.47s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:33:47<30:25:25, 6.47s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:47,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:47,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:33:53<30:17:13, 6.44s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:33:53<30:17:13, 6.44s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0633, 'learning_rate': 9.180000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:55,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:34:00<30:07:24, 6.41s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:34:00<30:07:24, 6.41s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8317, 'learning_rate': 9.190000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:01,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 922/17840 [1:34:06<29:46:27, 6.34s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 922/17840 [1:34:06<29:46:27, 6.34s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2174, 'learning_rate': 9.200000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 923/17840 [1:34:12<29:42:54, 6.32s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 923/17840 [1:34:12<29:42:54, 6.32s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.418, 'learning_rate': 9.21e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:14,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:14,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 924/17840 [1:34:18<29:27:01, 6.27s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 924/17840 [1:34:18<29:27:01, 6.27s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:20,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:20,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:34:27<32:30:20, 6.92s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:34:27<32:30:20, 6.92s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:34:27<32:30:20, 6.92s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:34:27<32:30:20, 6.92s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:30,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:30,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:34,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:34,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 927/17840 [1:34:39<30:06:28, 6.41s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:38,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:38,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:38,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 928/17840 [1:34:44<29:09:42, 6.21s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:44,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:44,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:44,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:34:50<28:24:11, 6.05s/it]g-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:50,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:50,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:50,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:14:26,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 930/17840 [1:34:55<27:36:17, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:56,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:56,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 931/17840 [1:35:01<26:52:09, 5.72s/it]g-point operations will not be computed-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:00,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:00,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:00,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:54,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 932/17840 [1:35:06<26:09:56, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 932/17840 [1:35:06<26:09:56, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 932/17840 [1:35:06<26:09:56, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:08,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:10,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:13,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:13,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1431, 'learning_rate': 9.320000000000002e-05, 'epoch': 1.05} +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:16,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:16,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:04,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 935/17840 [1:35:20<23:22:49, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:18,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:20,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:18,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:20,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:18,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 936/17840 [1:35:24<22:16:36, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:22,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:24,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:22,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:24,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:22,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 937/17840 [1:35:28<20:59:50, 4.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 938/17840 [1:35:32<19:43:31, 4.20s/it]g-point operations will not be computed-17 18:16:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 938/17840 [1:35:32<19:43:31, 4.20s/it]g-point operations will not be computed-17 18:16:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:31,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:30,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:31,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:30,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 939/17840 [1:35:35<18:02:40, 3.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:33,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 940/17840 [1:35:38<16:24:16, 3.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:35,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 940/17840 [1:35:38<16:24:16, 3.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:35,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 941/17840 [1:35:40<14:49:29, 3.16s/it]g-point operations will not be computed-17 18:16:35,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 941/17840 [1:35:40<14:49:29, 3.16s/it]g-point operations will not be computed-17 18:16:35,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:35:42<13:26:23, 2.86s/it]g-point operations will not be computed-17 18:16:38,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:35:42<13:26:23, 2.86s/it]g-point operations will not be computed-17 18:16:38,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:35:42<13:26:23, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:41,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:35:42<13:26:23, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:41,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:45,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:41,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 943/17840 [1:35:50<20:22:44, 4.34s/it]g-point operations will not be computed-17 18:16:41,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 943/17840 [1:35:50<20:22:44, 4.34s/it]g-point operations will not be computed-17 18:16:41,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 943/17840 [1:35:50<20:22:44, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 943/17840 [1:35:50<20:22:44, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:57<24:55:45, 5.31s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:57<24:55:45, 5.31s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:57<24:55:45, 5.31s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:57<24:55:45, 5.31s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:57<24:55:45, 5.31s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:36:05<27:58:39, 5.96s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:06,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:06,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:36:12<30:03:55, 6.41s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:36:12<30:03:55, 6.41s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0815, 'learning_rate': 9.44e-05, 'epoch': 1.06} + 5%|███▉ | 946/17840 [1:36:12<30:03:55, 6.41s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:36:12<30:03:55, 6.41s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:36:12<30:03:55, 6.41s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:36:20<31:25:54, 6.70s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:36:20<31:25:54, 6.70s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:22,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:27<32:18:36, 6.89s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:27<32:18:36, 6.89s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3819, 'learning_rate': 9.46e-05, 'epoch': 1.06} + 5%|███▉ | 948/17840 [1:36:27<32:18:36, 6.89s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:27<32:18:36, 6.89s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:36:34<32:53:30, 7.01s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:36:34<32:53:30, 7.01s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9344, 'learning_rate': 9.47e-05, 'epoch': 1.06} + 5%|███▉ | 949/17840 [1:36:34<32:53:30, 7.01s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:36:34<32:53:30, 7.01s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:36:34<32:53:30, 7.01s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:36:44<36:44:57, 7.83s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:36:44<36:44:57, 7.83s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:47,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:36:51<35:57:27, 7.66s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:36:51<35:57:27, 7.66s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0066, 'learning_rate': 9.49e-05, 'epoch': 1.07} + 5%|███▉ | 951/17840 [1:36:51<35:57:27, 7.66s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:36:51<35:57:27, 7.66s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:36:59<35:08:35, 7.49s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:36:59<35:08:35, 7.49s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6464, 'learning_rate': 9.5e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:01,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:37:06<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:37:06<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2886, 'learning_rate': 9.51e-05, 'epoch': 1.07} + 5%|███▉ | 953/17840 [1:37:06<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:37:06<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:37:06<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:37:13<34:08:45, 7.28s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:37:13<34:08:45, 7.28s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:15,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:37:20<33:49:03, 7.21s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:37:20<33:49:03, 7.21s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4614, 'learning_rate': 9.53e-05, 'epoch': 1.07} + 5%|███▉ | 955/17840 [1:37:20<33:49:03, 7.21s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:37:20<33:49:03, 7.21s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:37:20<33:49:03, 7.21s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:37:27<33:26:49, 7.13s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:27,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:27,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:37:34<33:03:17, 7.05s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:37:34<33:03:17, 7.05s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1165, 'learning_rate': 9.55e-05, 'epoch': 1.07} + 5%|███▉ | 957/17840 [1:37:34<33:03:17, 7.05s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:37,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:37,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0898, 'learning_rate': 9.56e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:37,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:37,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:37,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:37:47<32:43:41, 6.98s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:37:47<32:43:41, 6.98s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:49,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:37:54<32:23:10, 6.91s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:37:54<32:23:10, 6.91s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9989, 'learning_rate': 9.58e-05, 'epoch': 1.08} + 5%|███▉ | 960/17840 [1:37:54<32:23:10, 6.91s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:37:54<32:23:10, 6.91s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:37:54<32:23:10, 6.91s/it]g-point operations will not be computed-17 18:16:49,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:38:01<32:10:40, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:38:01<32:10:40, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:38:01<32:10:40, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:38:08<31:59:16, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:38:08<31:59:16, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:08,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:08,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 963/17840 [1:38:14<31:43:09, 6.77s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 963/17840 [1:38:14<31:43:09, 6.77s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3636, 'learning_rate': 9.61e-05, 'epoch': 1.08} + 5%|███▉ | 963/17840 [1:38:14<31:43:09, 6.77s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:18,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:18,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4926, 'learning_rate': 9.620000000000001e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:18,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:18,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:18,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:38:27<31:16:03, 6.67s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:28,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:28,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:28,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 966/17840 [1:38:34<30:56:52, 6.60s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:34,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:34,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:38:40<30:39:46, 6.54s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:38:40<30:39:46, 6.54s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2967, 'learning_rate': 9.65e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:42,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:38:47<30:24:49, 6.49s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:38:47<30:24:49, 6.49s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0922, 'learning_rate': 9.66e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:48,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:38:53<30:05:38, 6.42s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:38:53<30:05:38, 6.42s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.198, 'learning_rate': 9.67e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:54,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 970/17840 [1:38:59<29:50:06, 6.37s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 970/17840 [1:38:59<29:50:06, 6.37s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0354, 'learning_rate': 9.680000000000001e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:01,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 971/17840 [1:39:05<29:40:54, 6.33s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 971/17840 [1:39:05<29:40:54, 6.33s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3444, 'learning_rate': 9.69e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:07,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:39:12<29:34:51, 6.31s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:39:12<29:34:51, 6.31s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2437, 'learning_rate': 9.7e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:13,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 973/17840 [1:39:18<29:23:22, 6.27s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 973/17840 [1:39:18<29:23:22, 6.27s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3317, 'learning_rate': 9.71e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:19,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:39:24<29:00:59, 6.19s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:39:24<29:00:59, 6.19s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.417, 'learning_rate': 9.72e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:25,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:25,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:39:32<32:08:07, 6.86s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:39:32<32:08:07, 6.86s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:34,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:34,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 976/17840 [1:39:38<30:50:52, 6.59s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 976/17840 [1:39:38<30:50:52, 6.59s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:39,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:39,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 977/17840 [1:39:44<29:32:48, 6.31s/it]g-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:44,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:44,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:44,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:00,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:39:49<28:36:44, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:39:49<28:36:44, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:52,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:52,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9394, 'learning_rate': 9.77e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:56,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:56,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 980/17840 [1:40:00<26:53:06, 5.74s/it]g-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:00,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:00,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:00,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 981/17840 [1:40:05<26:04:03, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 981/17840 [1:40:05<26:04:03, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 981/17840 [1:40:05<26:04:03, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:07,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:12,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:12,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:14,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:16,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:16,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3604, 'learning_rate': 9.82e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:19,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:19,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:04,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 985/17840 [1:40:23<21:54:45, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:21,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 986/17840 [1:40:27<20:39:09, 4.41s/it]g-point operations will not be computed-17 18:21:21,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 986/17840 [1:40:27<20:39:09, 4.41s/it]g-point operations will not be computed-17 18:21:21,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 986/17840 [1:40:27<20:39:09, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:25,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 986/17840 [1:40:27<20:39:09, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:25,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 987/17840 [1:40:31<19:17:18, 4.12s/it]g-point operations will not be computed-17 18:21:25,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:30,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:28,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:30,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:28,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 988/17840 [1:40:34<17:42:01, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:31,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 988/17840 [1:40:34<17:42:01, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:31,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 989/17840 [1:40:36<16:17:03, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:34,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 989/17840 [1:40:36<16:17:03, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:34,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 990/17840 [1:40:39<14:47:14, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:36,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 990/17840 [1:40:39<14:47:14, 3.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:36,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 991/17840 [1:40:41<13:31:01, 2.89s/it]g-point operations will not be computed-17 18:21:36,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 992/17840 [1:40:43<12:26:39, 2.66s/it]g-point operations will not be computed-17 18:21:39,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 992/17840 [1:40:43<12:26:39, 2.66s/it]g-point operations will not be computed-17 18:21:39,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 992/17840 [1:40:43<12:26:39, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 992/17840 [1:40:43<12:26:39, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 993/17840 [1:40:51<19:40:07, 4.20s/it]g-point operations will not be computed-17 18:21:42,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 993/17840 [1:40:51<19:40:07, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:50,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 993/17840 [1:40:51<19:40:07, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:50,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:54,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:50,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:54,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:50,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 994/17840 [1:40:59<24:35:21, 5.25s/it]g-point operations will not be computed-17 18:21:50,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 994/17840 [1:40:59<24:35:21, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 994/17840 [1:40:59<24:35:21, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 994/17840 [1:40:59<24:35:21, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 994/17840 [1:40:59<24:35:21, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 995/17840 [1:41:06<27:51:50, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 995/17840 [1:41:06<27:51:50, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:09,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:09,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:41:14<29:55:11, 6.39s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:41:14<29:55:11, 6.39s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:41:14<29:55:11, 6.39s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:41:14<29:55:11, 6.39s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:41:14<29:55:11, 6.39s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:41:21<31:11:49, 6.67s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:41:21<31:11:49, 6.67s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:41:21<31:11:49, 6.67s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:41:21<31:11:49, 6.67s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:41:21<31:11:49, 6.67s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:41:28<32:00:56, 6.84s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:29,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:29,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:29,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:36<32:39:37, 6.98s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:36<32:39:37, 6.98s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:36<32:39:37, 6.98s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:36<32:39:37, 6.98s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:36<32:39:37, 6.98s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:41:45<36:36:01, 7.82s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:41:45<36:36:01, 7.82s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:41:45<36:36:01, 7.82s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2591, 'learning_rate': 9.99e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:42:00<34:54:45, 7.46s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:42:07<34:19:35, 7.34s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:42:07<34:19:35, 7.34s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1982, 'learning_rate': 9.999406175771971e-05, 'epoch': 1.12} + 6%|████ | 1003/17840 [1:42:07<34:19:35, 7.34s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:42:07<34:19:35, 7.34s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:42:07<34:19:35, 7.34s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1004/17840 [1:42:14<33:52:20, 7.24s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:14,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:14,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:42:21<33:31:52, 7.17s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:42:21<33:31:52, 7.17s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3278, 'learning_rate': 9.998218527315915e-05, 'epoch': 1.13} + 6%|████ | 1005/17840 [1:42:21<33:31:52, 7.17s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2707, 'learning_rate': 9.997624703087887e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:25,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:42:35<32:50:01, 7.02s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:42:35<32:50:01, 7.02s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:37,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:41<32:34:39, 6.97s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:41<32:34:39, 6.97s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2997, 'learning_rate': 9.99643705463183e-05, 'epoch': 1.13} + 6%|████ | 1008/17840 [1:42:41<32:34:39, 6.97s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:41<32:34:39, 6.97s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:41<32:34:39, 6.97s/it]g-point operations will not be computed-17 18:21:58,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1009/17840 [1:42:48<32:26:15, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1009/17840 [1:42:48<32:26:15, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1009/17840 [1:42:48<32:26:15, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:42:55<32:16:15, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:42:55<32:16:15, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1074, 'learning_rate': 9.995249406175773e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:57,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:43:02<32:08:41, 6.88s/it]g-point operations will not be computed-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:43:02<32:08:41, 6.88s/it]g-point operations will not be computed-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1079, 'learning_rate': 9.994655581947743e-05, 'epoch': 1.13} + 6%|████▏ | 1011/17840 [1:43:02<32:08:41, 6.88s/it]g-point operations will not be computed-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:43:02<32:08:41, 6.88s/it]g-point operations will not be computed-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:43:02<32:08:41, 6.88s/it]g-point operations will not be computed-17 18:23:47,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:43:09<31:53:45, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:43:09<31:53:45, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:43:09<31:53:45, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:43:15<31:38:52, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:43:15<31:38:52, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:16,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:16,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:43:22<31:42:21, 6.78s/it]g-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:43:22<31:42:21, 6.78s/it]g-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0194, 'learning_rate': 9.992874109263658e-05, 'epoch': 1.14} + 6%|████▏ | 1014/17840 [1:43:22<31:42:21, 6.78s/it]g-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.976, 'learning_rate': 9.99228028503563e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:07,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:43:35<31:18:56, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:43:35<31:18:56, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:43:35<31:18:56, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:43:35<31:18:56, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1017/17840 [1:43:42<31:03:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:42,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:42,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:42,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1018/17840 [1:43:48<30:44:10, 6.58s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:48,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:48,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:48,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:43:55<30:28:14, 6.52s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:55,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:55,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:55,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:44:01<30:23:30, 6.50s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:44:01<30:23:30, 6.50s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:03,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:03,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:44:07<30:13:50, 6.47s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:44:07<30:13:50, 6.47s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:09,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:44:14<29:55:17, 6.40s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:44:14<29:55:17, 6.40s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1039, 'learning_rate': 9.98812351543943e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:15,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:44:20<29:26:39, 6.30s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:44:20<29:26:39, 6.30s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2091, 'learning_rate': 9.987529691211401e-05, 'epoch': 1.15} + 6%|████▏ | 1023/17840 [1:44:20<29:26:39, 6.30s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:23,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:23,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2348, 'learning_rate': 9.986935866983373e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:23,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:23,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:44:34<32:02:42, 6.86s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:44:34<32:02:42, 6.86s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1605, 'learning_rate': 9.986342042755345e-05, 'epoch': 1.15} + 6%|████▏ | 1025/17840 [1:44:34<32:02:42, 6.86s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:37,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:37,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2235, 'learning_rate': 9.985748218527317e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:41,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:41,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1027/17840 [1:44:46<29:34:16, 6.33s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:46,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:46,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:46,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1028/17840 [1:44:52<28:39:32, 6.14s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:51,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:54,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:54,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1808, 'learning_rate': 9.98396674584323e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:58,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1030/17840 [1:45:03<27:13:44, 5.83s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1030/17840 [1:45:03<27:13:44, 5.83s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:02,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:02,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:02,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1031/17840 [1:45:08<26:26:11, 5.66s/it]g-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:07,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:10,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:10,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:12,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:12,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:12,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:34,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1033/17840 [1:45:18<24:45:50, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:26:16,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:18,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:16,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:18,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:16,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1034/17840 [1:45:22<23:45:36, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:23,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1035/17840 [1:45:27<22:36:55, 4.84s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1035/17840 [1:45:27<22:36:55, 4.84s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:26,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:28,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:28,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:30,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:30,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:31,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:35,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:35,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:36,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:36,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:39,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:40,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:40,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:42,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:42,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:44,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:44,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1951, 'learning_rate': 9.97624703087886e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:48,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:48,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:52,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:52,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3931, 'learning_rate': 9.975653206650832e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:56,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:56,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:56,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:00,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:00,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:00,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:07,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:07,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2324, 'learning_rate': 9.974465558194775e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:07,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:07,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:46:18<29:36:58, 6.35s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:46:18<29:36:58, 6.35s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2482, 'learning_rate': 9.973871733966747e-05, 'epoch': 1.17} + 6%|████▎ | 1046/17840 [1:46:18<29:36:58, 6.35s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:46:18<29:36:58, 6.35s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:46:18<29:36:58, 6.35s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:46:25<31:01:07, 6.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:46:25<31:01:07, 6.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:46:25<31:01:07, 6.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:29,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:29,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0283, 'learning_rate': 9.97268408551069e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:29,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:29,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:29,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:39<32:26:31, 6.96s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:39<32:26:31, 6.96s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:39<32:26:31, 6.96s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:39<32:26:31, 6.96s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:39<32:26:31, 6.96s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:46:49<36:18:28, 7.78s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:50,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:50,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█���██▎ | 1051/17840 [1:46:57<35:40:56, 7.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1051/17840 [1:46:57<35:40:56, 7.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1909, 'learning_rate': 9.970902612826603e-05, 'epoch': 1.18} + 6%|████▎ | 1051/17840 [1:46:57<35:40:56, 7.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1051/17840 [1:46:57<35:40:56, 7.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1051/17840 [1:46:57<35:40:56, 7.65s/it]g-point operations will not be computed-17 18:26:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:47:04<34:52:40, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:47:04<34:52:40, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:47:04<34:52:40, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:47:11<34:17:18, 7.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:47:11<34:17:18, 7.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1967, 'learning_rate': 9.969714964370547e-05, 'epoch': 1.18} + 6%|████▎ | 1053/17840 [1:47:11<34:17:18, 7.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:47:11<34:17:18, 7.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:47:11<34:17:18, 7.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:02,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:47:18<33:50:22, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:47:18<33:50:22, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:47:18<33:50:22, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1055/17840 [1:47:25<33:26:33, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1055/17840 [1:47:25<33:26:33, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4234, 'learning_rate': 9.96852731591449e-05, 'epoch': 1.18} + 6%|████▎ | 1055/17840 [1:47:25<33:26:33, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2989, 'learning_rate': 9.96793349168646e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:47:38<32:45:00, 7.03s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:39,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:39,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:39,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:47:45<32:31:11, 6.98s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:47:45<32:31:11, 6.98s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:47:45<32:31:11, 6.98s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:49,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:49,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7881, 'learning_rate': 9.966152019002377e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:49,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:49,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:49,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:47:59<32:00:10, 6.87s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:59,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:59,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:59,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1061/17840 [1:48:06<31:49:01, 6.83s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1061/17840 [1:48:06<31:49:01, 6.83s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:08,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:08,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:48:12<31:39:00, 6.79s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:48:12<31:39:00, 6.79s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:48:12<31:39:00, 6.79s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3554, 'learning_rate': 9.963776722090262e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:16,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:48:26<31:27:27, 6.75s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:48:32<31:09:21, 6.69s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:48:32<31:09:21, 6.69s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:34,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:34,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:48:39<30:55:01, 6.64s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:48:39<30:55:01, 6.64s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:48:39<30:55:01, 6.64s/it]g-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:42,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:42,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0641, 'learning_rate': 9.961401425178148e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:42,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:42,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:42,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:28:16,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:48:52<30:35:05, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:50,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:48:52<30:35:05, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:50,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:48:52<30:35:05, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:50,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:48:52<30:35:05, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:50,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:48:58<30:23:05, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:57,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:48:58<30:23:05, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:57,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:48:58<30:23:05, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:57,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:48:58<30:23:05, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:57,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:49:05<30:09:55, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:49:05<30:09:55, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:49:05<30:09:55, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:49:05<30:09:55, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1071/17840 [1:49:11<29:57:32, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:11,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:11,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:11,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1072/17840 [1:49:17<29:47:20, 6.40s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:17,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:17,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1073/17840 [1:49:23<29:28:26, 6.33s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1073/17840 [1:49:23<29:28:26, 6.33s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:23,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:23,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:23,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1074/17840 [1:49:29<29:08:32, 6.26s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:29,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:29,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:49:38<31:58:02, 6.86s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:49:38<31:58:02, 6.86s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:38,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:38,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:38,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:49:44<30:38:37, 6.58s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:43,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:43,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:43,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:49:49<29:28:59, 6.33s/it]g-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:49,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:49,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:49,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:03,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1078/17840 [1:49:55<28:39:33, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1078/17840 [1:49:55<28:39:33, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:58,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:58,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4258, 'learning_rate': 9.954275534441807e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:02,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1080/17840 [1:50:06<27:00:14, 5.80s/it]g-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1080/17840 [1:50:06<27:00:14, 5.80s/it]g-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:06,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:08,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:08,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5368, 'learning_rate': 9.953087885985749e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:12,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1082/17840 [1:50:16<25:25:29, 5.46s/it]g-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1082/17840 [1:50:16<25:25:29, 5.46s/it]g-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:16,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:18,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:18,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:21,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:21,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:21,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:54,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1084/17840 [1:50:26<23:37:17, 5.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:24,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1085/17840 [1:50:30<22:29:47, 4.83s/it]g-point operations will not be computed-17 18:31:24,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1085/17840 [1:50:30<22:29:47, 4.83s/it]g-point operations will not be computed-17 18:31:24,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1085/17840 [1:50:30<22:29:47, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:28,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:50:34<21:24:15, 4.60s/it]g-point operations will not be computed-17 18:31:28,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:50:34<21:24:15, 4.60s/it]g-point operations will not be computed-17 18:31:28,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:50:34<21:24:15, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:32,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:50:34<21:24:15, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:32,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:50:38<20:05:58, 4.32s/it]g-point operations will not be computed-17 18:31:32,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:37,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:37,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1088/17840 [1:50:41<18:42:02, 4.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:39,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:40,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:39,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:40,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:39,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:50:44<17:23:00, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:42,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:50:44<17:23:00, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:42,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1090/17840 [1:50:47<16:05:04, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:45,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1090/17840 [1:50:47<16:05:04, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:45,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1091/17840 [1:50:49<14:36:07, 3.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:47,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1091/17840 [1:50:49<14:36:07, 3.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:47,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:52<13:17:10, 2.86s/it]g-point operations will not be computed-17 18:31:47,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:52<13:17:10, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:52<13:17:10, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:55,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:55,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:51:00<20:21:07, 4.37s/it]g-point operations will not be computed-17 18:31:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:51:00<20:21:07, 4.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:51:00<20:21:07, 4.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:02,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:02,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:51:07<24:53:51, 5.35s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:51:07<24:53:51, 5.35s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:51:07<24:53:51, 5.35s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:51:07<24:53:51, 5.35s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:51:07<24:53:51, 5.35s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:51:15<27:51:32, 5.99s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:15,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:15,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:15,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:51:22<29:51:16, 6.42s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:51:22<29:51:16, 6.42s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:51:22<29:51:16, 6.42s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:51:22<29:51:16, 6.42s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:51:22<29:51:16, 6.42s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:51:29<31:11:28, 6.71s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:51:29<31:11:28, 6.71s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:51:29<31:11:28, 6.71s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.312, 'learning_rate': 9.942992874109263e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:44<32:34:15, 7.00s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:44<32:34:15, 7.00s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:44<32:34:15, 7.00s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:44<32:34:15, 7.00s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:44<32:34:15, 7.00s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:51:54<36:24:52, 7.83s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:51:54<36:24:52, 7.83s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:51:54<36:24:52, 7.83s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:58,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:58,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5535, 'learning_rate': 9.941211401425179e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:58,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:58,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:58,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:52:08<34:50:55, 7.50s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:52:08<34:50:55, 7.50s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:52:08<34:50:55, 7.50s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:12,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:12,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1872, 'learning_rate': 9.940023752969122e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:12,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:12,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:12,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:52:22<33:43:01, 7.25s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:52:29<33:20:03, 7.17s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:52:29<33:20:03, 7.17s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:52:29<33:20:03, 7.17s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:52:29<33:20:03, 7.17s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:52:29<33:20:03, 7.17s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:52:36<33:00:22, 7.10s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:52:43<32:41:40, 7.03s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:52:43<32:41:40, 7.03s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:45,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:52:50<32:26:34, 6.98s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:52:50<32:26:34, 6.98s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2115, 'learning_rate': 9.93705463182898e-05, 'epoch': 1.24} + 6%|████▌ | 1108/17840 [1:52:50<32:26:34, 6.98s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:52:50<32:26:34, 6.98s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:52:50<32:26:34, 6.98s/it]g-point operations will not be computed-17 18:31:58,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:52:57<32:15:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:52:57<32:15:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:52:57<32:15:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:53:04<32:04:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:53:04<32:04:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3808, 'learning_rate': 9.935866983372922e-05, 'epoch': 1.24} + 6%|████▌ | 1110/17840 [1:53:04<32:04:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:07,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:07,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2319, 'learning_rate': 9.935273159144893e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:07,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:07,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:07,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:53:17<31:41:43, 6.82s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:17,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:17,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:17,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:53:24<31:30:41, 6.78s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:53:24<31:30:41, 6.78s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:26,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:53:30<31:22:26, 6.75s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:53:30<31:22:26, 6.75s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3834, 'learning_rate': 9.933491686460809e-05, 'epoch': 1.25} + 6%|████▌ | 1114/17840 [1:53:30<31:22:26, 6.75s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:34,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:34,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.143, 'learning_rate': 9.93289786223278e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:34,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:34,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:34,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:53:44<31:04:31, 6.69s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:44,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:44,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:44,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:53:50<30:51:23, 6.64s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:50,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:50,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:53:57<30:35:13, 6.58s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:53:57<30:35:13, 6.58s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7334, 'learning_rate': 9.931116389548694e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:58,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:54:03<30:19:46, 6.53s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:54:03<30:19:46, 6.53s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2503, 'learning_rate': 9.930522565320666e-05, 'epoch': 1.25} + 6%|████▌ | 1119/17840 [1:54:03<30:19:46, 6.53s/it]g-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:06,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:06,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9444, 'learning_rate': 9.929928741092637e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:06,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:06,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:06,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:55,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:54:16<29:55:24, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:54:16<29:55:24, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3387, 'learning_rate': 9.92874109263658e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:14,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1123/17840 [1:54:28<29:23:21, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:27,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1123/17840 [1:54:28<29:23:21, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:27,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1123/17840 [1:54:28<29:23:21, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:27,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1123/17840 [1:54:28<29:23:21, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:27,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:54:34<29:02:34, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:33,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:54:34<29:02:34, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:33,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:54:34<29:02:34, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:33,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:54:34<29:02:34, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:33,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:54:43<31:46:56, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:54:43<31:46:56, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:45,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:45,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1443, 'learning_rate': 9.926365795724466e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:45,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:51,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:51,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3163, 'learning_rate': 9.925771971496437e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:55,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1128/17840 [1:55:00<28:33:11, 6.15s/it]g-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1128/17840 [1:55:00<28:33:11, 6.15s/it]g-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:00,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:00,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:41,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:55:06<27:44:03, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:55:06<27:44:03, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2916, 'learning_rate': 9.92458432304038e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:08,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:08,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2584, 'learning_rate': 9.923990498812352e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:12,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:12,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1131/17840 [1:55:16<26:13:13, 5.65s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:16,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:18,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:18,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9781, 'learning_rate': 9.922802850356295e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:22,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:22,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:55:26<24:19:59, 5.24s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:25,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:25,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:27,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:29,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:29,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:31,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:33,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:33,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:35,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:37,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:37,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:40,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:40,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:42,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:44,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:44,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:46,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:46,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:48,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:48,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:49,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:49,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:52,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:52,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:59,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:59,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:03,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:03,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:03,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:07,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:56:17<27:12:56, 5.87s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:56:17<27:12:56, 5.87s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:56:17<27:12:56, 5.87s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:56:17<27:12:56, 5.87s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:56:17<27:12:56, 5.87s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:56:25<29:10:04, 6.29s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:56:25<29:10:04, 6.29s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:56:25<29:10:04, 6.29s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:29,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:29,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2615, 'learning_rate': 9.913895486935868e-05, 'epoch': 1.29} +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:29,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:29,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:29,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:39<31:37:28, 6.82s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:39<31:37:28, 6.82s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:39<31:37:28, 6.82s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:39<31:37:28, 6.82s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:39<31:37:28, 6.82s/it]g-point operations will not be computed-17 18:36:04,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:46<32:05:26, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:46<32:05:26, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:46<32:05:26, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:46<32:05:26, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:56<35:51:55, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:56<35:51:55, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:56<35:51:55, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:56<35:51:55, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:56<35:51:55, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:57:03<35:09:45, 7.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:57:03<35:09:45, 7.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:57:03<35:09:45, 7.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:07,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:07,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1517, 'learning_rate': 9.910926365795726e-05, 'epoch': 1.29} +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:07,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:07,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:07,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:57:18<34:06:41, 7.36s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:57:18<34:06:41, 7.36s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:20,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:57:25<33:39:05, 7.26s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:57:25<33:39:05, 7.26s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5159, 'learning_rate': 9.909738717339669e-05, 'epoch': 1.29} + 6%|████▋ | 1154/17840 [1:57:25<33:39:05, 7.26s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:57:25<33:39:05, 7.26s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:57:25<33:39:05, 7.26s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:57:32<33:18:51, 7.19s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:57:32<33:18:51, 7.19s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:34,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:34,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:57:39<32:58:19, 7.11s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:57:39<32:58:19, 7.11s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:57:39<32:58:19, 7.11s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:42,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:42,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4424, 'learning_rate': 9.907957244655582e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:42,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:42,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:42,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:57:52<32:17:42, 6.97s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:53,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:53,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:57:59<31:56:37, 6.89s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:57:59<31:56:37, 6.89s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2301, 'learning_rate': 9.906769596199526e-05, 'epoch': 1.3} + 6%|████▋ | 1159/17840 [1:57:59<31:56:37, 6.89s/it]g-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8967, 'learning_rate': 9.906175771971497e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:45,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1161/17840 [1:58:13<31:42:28, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1161/17840 [1:58:13<31:42:28, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1161/17840 [1:58:13<31:42:28, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:58:19<31:27:22, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:58:19<31:27:22, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1486, 'learning_rate': 9.90498812351544e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:21,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:58:26<31:12:59, 6.74s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:58:26<31:12:59, 6.74s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2477, 'learning_rate': 9.904394299287411e-05, 'epoch': 1.3} + 7%|████▊ | 1163/17840 [1:58:26<31:12:59, 6.74s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:29,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:29,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4886, 'learning_rate': 9.903800475059382e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:29,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:29,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:29,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1165/17840 [1:58:39<30:42:20, 6.63s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:39,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:39,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:39,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:58:45<30:32:50, 6.60s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:46,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:46,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:58:52<30:23:43, 6.56s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:58:52<30:23:43, 6.56s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2411, 'learning_rate': 9.902019002375298e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:54,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:58:58<30:06:28, 6.50s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:58:58<30:06:28, 6.50s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0987, 'learning_rate': 9.901425178147269e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:00,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1169/17840 [1:59:05<29:55:55, 6.46s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1169/17840 [1:59:05<29:55:55, 6.46s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3283, 'learning_rate': 9.90083135391924e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:06,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:59:11<29:48:19, 6.44s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:59:11<29:48:19, 6.44s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7135, 'learning_rate': 9.900237529691212e-05, 'epoch': 1.31} + 7%|████▊ | 1170/17840 [1:59:11<29:48:19, 6.44s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:59:11<29:48:19, 6.44s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:59:11<29:48:19, 6.44s/it]g-point operations will not be computed-17 18:39:11,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:59:17<29:35:36, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:16,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:59:17<29:35:36, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:16,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:59:17<29:35:36, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:16,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:59:17<29:35:36, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:16,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:59:24<29:31:05, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:22,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:59:24<29:31:05, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:22,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:59:24<29:31:05, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:22,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:59:24<29:31:05, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:22,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:59:30<29:14:43, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:59:30<29:14:43, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:33,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:33,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3509, 'learning_rate': 9.897862232779098e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:33,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:33,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:59:44<31:46:50, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:59:44<31:46:50, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4633, 'learning_rate': 9.897268408551069e-05, 'epoch': 1.32} + 7%|████▊ | 1175/17840 [1:59:44<31:46:50, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:59:44<31:46:50, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:59:50<30:29:56, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:59:50<30:29:56, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:53,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:53,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5417, 'learning_rate': 9.896080760095012e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:57,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1178/17840 [2:00:02<28:28:56, 6.15s/it]g-point operations will not be computed-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1178/17840 [2:00:02<28:28:56, 6.15s/it]g-point operations will not be computed-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2256, 'learning_rate': 9.895486935866984e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:03,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1179/17840 [2:00:07<27:37:28, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1179/17840 [2:00:07<27:37:28, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4898, 'learning_rate': 9.894893111638956e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:10,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:10,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2115, 'learning_rate': 9.894299287410927e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:10,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:15,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:15,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:17,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:17,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:06,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1182/17840 [2:00:23<25:00:26, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1182/17840 [2:00:23<25:00:26, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:23,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:23,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1183/17840 [2:00:27<24:07:06, 5.21s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:27,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:27,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:29,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:31,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:31,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:33,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:35,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:35,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:37,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:39,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:39,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:40,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:40,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:43,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:45,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:45,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:48,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:48,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:50,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:50,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:51,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:51,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:53,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:53,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:57,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:57,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:57,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:01,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:01,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:05,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:05,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:05,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:09,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:09,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:09,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:16,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:16,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2639, 'learning_rate': 9.885391923990499e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:16,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:16,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:16,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:01:27<29:24:19, 6.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:01:27<29:24:19, 6.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:01:27<29:24:19, 6.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:01:27<29:24:19, 6.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:01:27<29:24:19, 6.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [2:01:34<30:58:39, 6.70s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:35,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:35,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [2:01:41<31:52:19, 6.89s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [2:01:41<31:52:19, 6.89s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3298, 'learning_rate': 9.883610451306414e-05, 'epoch': 1.34} + 7%|████▉ | 1198/17840 [2:01:41<31:52:19, 6.89s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [2:01:41<31:52:19, 6.89s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [2:01:41<31:52:19, 6.89s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:49<32:22:45, 7.00s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:49<32:22:45, 7.00s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:51,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [2:01:58<36:12:10, 7.83s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [2:01:58<36:12:10, 7.83s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0988, 'learning_rate': 9.882422802850356e-05, 'epoch': 1.35} + 7%|████▉ | 1200/17840 [2:01:58<36:12:10, 7.83s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [2:01:58<36:12:10, 7.83s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [2:01:58<36:12:10, 7.83s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:02:06<35:28:11, 7.67s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:02:06<35:28:11, 7.67s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:02:06<35:28:11, 7.67s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:02:06<35:28:11, 7.67s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:02:06<35:28:11, 7.67s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1202/17840 [2:02:13<34:47:32, 7.53s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:13,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:13,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:13,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:02:20<34:02:03, 7.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:02:20<34:02:03, 7.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:02:20<34:02:03, 7.36s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:24,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:24,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2956, 'learning_rate': 9.880047505938242e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:24,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:24,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [2:02:34<33:15:31, 7.20s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [2:02:34<33:15:31, 7.20s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2588, 'learning_rate': 9.879453681710214e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:36,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:41<32:58:12, 7.14s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:41<32:58:12, 7.14s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2632, 'learning_rate': 9.878859857482186e-05, 'epoch': 1.35} + 7%|████▉ | 1206/17840 [2:02:41<32:58:12, 7.14s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:41<32:58:12, 7.14s/it]g-point operations will not be computed-17 18:41:21,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [2:02:48<32:29:34, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [2:02:48<32:29:34, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4268, 'learning_rate': 9.878266033254158e-05, 'epoch': 1.35} + 7%|████▉ | 1207/17840 [2:02:48<32:29:34, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [2:02:55<32:02:10, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [2:02:55<32:02:10, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4228, 'learning_rate': 9.877672209026129e-05, 'epoch': 1.35} + 7%|████▉ | 1208/17840 [2:02:55<32:02:10, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.237, 'learning_rate': 9.877078384798101e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:46,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [2:03:08<31:46:16, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [2:03:08<31:46:16, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4958, 'learning_rate': 9.876484560570071e-05, 'epoch': 1.36} + 7%|████▉ | 1210/17840 [2:03:08<31:46:16, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [2:03:15<31:32:53, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [2:03:15<31:32:53, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1795, 'learning_rate': 9.875890736342042e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:17,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [2:03:22<31:25:55, 6.81s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [2:03:22<31:25:55, 6.81s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1613, 'learning_rate': 9.875296912114015e-05, 'epoch': 1.36} + 7%|████▉ | 1212/17840 [2:03:22<31:25:55, 6.81s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:25,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:25,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:25,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8176, 'learning_rate': 9.874703087885986e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:25,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1214/17840 [2:03:35<31:11:23, 6.75s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1214/17840 [2:03:35<31:11:23, 6.75s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:35,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:35,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [2:03:42<31:02:19, 6.72s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█���██▉ | 1215/17840 [2:03:42<31:02:19, 6.72s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1957, 'learning_rate': 9.873515439429929e-05, 'epoch': 1.36} + 7%|████▉ | 1215/17840 [2:03:42<31:02:19, 6.72s/it]g-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:45,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:45,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3805, 'learning_rate': 9.872921615201901e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:45,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:45,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:07,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [2:03:55<30:40:23, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [2:03:55<30:40:23, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1104, 'learning_rate': 9.872327790973872e-05, 'epoch': 1.36} + 7%|████▉ | 1217/17840 [2:03:55<30:40:23, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [2:04:01<30:20:37, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [2:04:01<30:20:37, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:01,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:01,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [2:04:08<30:09:37, 6.53s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [2:04:08<30:09:37, 6.53s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3022, 'learning_rate': 9.871140142517816e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:09,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [2:04:14<30:00:55, 6.50s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [2:04:14<30:00:55, 6.50s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4021, 'learning_rate': 9.870546318289786e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:16,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [2:04:20<29:48:23, 6.46s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [2:04:20<29:48:23, 6.46s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4757, 'learning_rate': 9.869952494061758e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:22,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [2:04:27<29:31:30, 6.40s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [2:04:27<29:31:30, 6.40s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6417, 'learning_rate': 9.869358669833729e-05, 'epoch': 1.37} + 7%|█████ | 1222/17840 [2:04:27<29:31:30, 6.40s/it]g-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:30,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:30,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2654, 'learning_rate': 9.868764845605701e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:30,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:36,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:36,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.345, 'learning_rate': 9.868171021377672e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:36,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:36,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:36,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:53,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:04:48<32:01:45, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:04:48<32:01:45, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:04:48<32:01:45, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:50,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:50,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:50,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:50,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:56,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:56,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:01,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:01,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [2:05:05<28:39:07, 6.21s/it]g-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [2:05:05<28:39:07, 6.21s/it]g-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:06,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:06,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [2:05:11<27:52:56, 6.04s/it]g-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:10,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:13,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:13,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.965, 'learning_rate': 9.864608076009501e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:17,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:17,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [2:05:22<26:17:15, 5.70s/it]g-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:21,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:21,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:21,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1232/17840 [2:05:27<25:35:42, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:27,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:27,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1233/17840 [2:05:32<24:43:46, 5.36s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:31,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:33,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:33,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:35,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:37,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:37,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:40,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:41,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:41,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:43,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:45,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:45,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:47,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:47,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:48,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:50,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:50,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:53,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:53,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:54,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:54,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:57,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:57,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:59,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:59,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:03,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:03,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:03,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:07,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:07,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:11,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:11,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:11,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:06:17<24:24:04, 5.29s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:06:17<24:24:04, 5.29s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:06:17<24:24:04, 5.29s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:22,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:22,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6945, 'learning_rate': 9.855700712589074e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:22,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:22,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:22,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:06:32<29:19:10, 6.36s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:06:32<29:19:10, 6.36s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:06:32<29:19:10, 6.36s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:06:32<29:19:10, 6.36s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:06:32<29:19:10, 6.36s/it]g-point operations will not be computed-17 18:46:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:39<30:31:25, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:39<30:31:25, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:39<30:31:25, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:39<30:31:25, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:47<31:30:35, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:47<31:30:35, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:47<31:30:35, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:47<31:30:35, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:47<31:30:35, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:06:54<32:00:06, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:55,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:55,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:07:04<35:37:09, 7.73s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:07:04<35:37:09, 7.73s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2715, 'learning_rate': 9.852731591448931e-05, 'epoch': 1.4} + 7%|█████ | 1250/17840 [2:07:04<35:37:09, 7.73s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:07:04<35:37:09, 7.73s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:07:04<35:37:09, 7.73s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:07:11<34:53:21, 7.57s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:07:11<34:53:21, 7.57s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:13,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:07:18<34:19:03, 7.45s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:07:18<34:19:03, 7.45s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1963, 'learning_rate': 9.851543942992875e-05, 'epoch': 1.4} + 7%|█████ | 1252/17840 [2:07:18<34:19:03, 7.45s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:07:18<34:19:03, 7.45s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:07:18<34:19:03, 7.45s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1253/17840 [2:07:25<33:41:16, 7.31s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1253/17840 [2:07:25<33:41:16, 7.31s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:27,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:07:32<33:13:53, 7.21s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:07:32<33:13:53, 7.21s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3615, 'learning_rate': 9.850356294536818e-05, 'epoch': 1.41} + 7%|█████▏ | 1254/17840 [2:07:32<33:13:53, 7.21s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:07:32<33:13:53, 7.21s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:07:32<33:13:53, 7.21s/it]g-point operations will not be computed-17 18:47:38,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:07:39<32:54:45, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:07:39<32:54:45, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:07:39<32:54:45, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [2:07:46<32:41:58, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [2:07:46<32:41:58, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0018, 'learning_rate': 9.84916864608076e-05, 'epoch': 1.41} + 7%|█████▏ | 1256/17840 [2:07:46<32:41:58, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:50,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:50,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5088, 'learning_rate': 9.848574821852731e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:50,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:50,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:08:00<32:10:38, 6.99s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:08:00<32:10:38, 6.99s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:00,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:00,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:08:07<32:08:40, 6.98s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:08:07<32:08:40, 6.98s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2287, 'learning_rate': 9.847387173396675e-05, 'epoch': 1.41} + 7%|█████▏ | 1259/17840 [2:08:07<32:08:40, 6.98s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:08:07<32:08:40, 6.98s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:08:07<32:08:40, 6.98s/it]g-point operations will not be computed-17 18:48:38,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:08:13<31:58:09, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:08:13<31:58:09, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:08:13<31:58:09, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [2:08:20<31:46:16, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [2:08:20<31:46:16, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4429, 'learning_rate': 9.846199524940618e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:22,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:08:27<31:34:55, 6.86s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:08:27<31:34:55, 6.86s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4097, 'learning_rate': 9.845605700712589e-05, 'epoch': 1.41} + 7%|█████▏ | 1262/17840 [2:08:27<31:34:55, 6.86s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0375, 'learning_rate': 9.845011876484561e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:31,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:08:40<31:19:04, 6.80s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:08:40<31:19:04, 6.80s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9689, 'learning_rate': 9.844418052256532e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:42,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [2:08:47<30:57:48, 6.73s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [2:08:47<30:57:48, 6.73s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2414, 'learning_rate': 9.843824228028504e-05, 'epoch': 1.42} + 7%|█████▏ | 1265/17840 [2:08:47<30:57:48, 6.73s/it]g-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:50,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:50,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2558, 'learning_rate': 9.843230403800476e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:50,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:57,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:57,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0658, 'learning_rate': 9.842636579572448e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:57,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:57,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:57,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:49:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:09:07<30:17:31, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:05,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:09:07<30:17:31, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:05,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:09:07<30:17:31, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:05,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:09:07<30:17:31, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:05,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1269/17840 [2:09:13<30:00:33, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1269/17840 [2:09:13<30:00:33, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1269/17840 [2:09:13<30:00:33, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1269/17840 [2:09:13<30:00:33, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1270/17840 [2:09:19<29:48:16, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:09:26<29:32:24, 6.42s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:09:26<29:32:24, 6.42s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:27,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:27,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:09:32<29:16:19, 6.36s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:09:32<29:16:19, 6.36s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:33,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:33,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:09:38<29:06:22, 6.32s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:09:38<29:06:22, 6.32s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:40,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:40,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:09:44<28:59:39, 6.30s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:09:44<28:59:39, 6.30s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:46,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1275/17840 [2:09:53<31:50:34, 6.92s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1275/17840 [2:09:53<31:50:34, 6.92s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3169, 'learning_rate': 9.837885985748219e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:54,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:54,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1276/17840 [2:09:59<30:32:10, 6.64s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1276/17840 [2:09:59<30:32:10, 6.64s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:00,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:00,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1277/17840 [2:10:04<29:26:37, 6.40s/it]g-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:11,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1278/17840 [2:10:10<28:25:24, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1278/17840 [2:10:10<28:25:24, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:13,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:13,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2, 'learning_rate': 9.835510688836105e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:17,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1280/17840 [2:10:21<26:53:07, 5.84s/it]g-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1280/17840 [2:10:21<26:53:07, 5.84s/it]g-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:21,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:21,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:21,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:09,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:10:27<26:11:11, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:10:27<26:11:11, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:29,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:29,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1209, 'learning_rate': 9.833729216152019e-05, 'epoch': 1.44} +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:32,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:32,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [2:10:37<24:48:19, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [2:10:37<24:48:19, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:41,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:43,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:43,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:45,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:47,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:47,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:49,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:51,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:51,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:52,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:52,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:54,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:57,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:57,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:59,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:59,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:01,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:02,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:02,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:05,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:05,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7096, 'learning_rate': 9.827790973871735e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:16,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:16,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:16,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:11:23<24:18:44, 5.29s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:11:23<24:18:44, 5.29s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:11:23<24:18:44, 5.29s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.423, 'learning_rate': 9.826009501187648e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:38<29:17:32, 6.37s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:38<29:17:32, 6.37s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:38<29:17:32, 6.37s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:38<29:17:32, 6.37s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:38<29:17:32, 6.37s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [2:11:45<30:39:26, 6.67s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [2:11:45<30:39:26, 6.67s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:48,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:53<31:37:13, 6.88s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:53<31:37:13, 6.88s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.11, 'learning_rate': 9.824228028503563e-05, 'epoch': 1.46} + 7%|█████▎ | 1298/17840 [2:11:53<31:37:13, 6.88s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:53<31:37:13, 6.88s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:53<31:37:13, 6.88s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1299/17840 [2:12:00<32:14:51, 7.02s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1299/17840 [2:12:00<32:14:51, 7.02s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:02,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:02,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:02,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.253, 'learning_rate': 9.823040380047507e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:02,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:02,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:12:17<34:56:57, 7.61s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:12:17<34:56:57, 7.61s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2895, 'learning_rate': 9.822446555819478e-05, 'epoch': 1.46} + 7%|█████▎ | 1301/17840 [2:12:17<34:56:57, 7.61s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.48, 'learning_rate': 9.82185273159145e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:12:31<33:36:48, 7.32s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:12:31<33:36:48, 7.32s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2685, 'learning_rate': 9.82125890736342e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:33,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:12:38<33:15:15, 7.24s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:12:38<33:15:15, 7.24s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3637, 'learning_rate': 9.820665083135391e-05, 'epoch': 1.46} + 7%|█████▎ | 1304/17840 [2:12:38<33:15:15, 7.24s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:12:38<33:15:15, 7.24s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:12:45<33:01:14, 7.19s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:12:45<33:01:14, 7.19s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:45,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:45,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:12:52<32:46:16, 7.14s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:12:52<32:46:16, 7.14s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2033, 'learning_rate': 9.819477434679335e-05, 'epoch': 1.46} + 7%|█████▎ | 1306/17840 [2:12:52<32:46:16, 7.14s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:56,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:56,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:56,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:59,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:59,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:13:06<32:15:52, 7.03s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:13:06<32:15:52, 7.03s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1901, 'learning_rate': 9.818289786223278e-05, 'epoch': 1.47} + 7%|█████▎ | 1308/17840 [2:13:06<32:15:52, 7.03s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:10,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:10,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1616, 'learning_rate': 9.81769596199525e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:10,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:10,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1310/17840 [2:13:20<31:57:07, 6.96s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1310/17840 [2:13:20<31:57:07, 6.96s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2589, 'learning_rate': 9.817102137767221e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:22,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:13:26<31:42:46, 6.91s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:13:26<31:42:46, 6.91s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4206, 'learning_rate': 9.816508313539193e-05, 'epoch': 1.47} + 7%|█████▎ | 1311/17840 [2:13:26<31:42:46, 6.91s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:13:26<31:42:46, 6.91s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:13:26<31:42:46, 6.91s/it]g-point operations will not be computed-17 18:51:35,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:13:33<31:40:29, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:13:33<31:40:29, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:13:33<31:40:29, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:13:40<31:30:55, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:13:40<31:30:55, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:40,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:40,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:40,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:13:47<31:19:07, 6.82s/it]g-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:13:47<31:19:07, 6.82s/it]g-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:13:47<31:19:07, 6.82s/it]g-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:13:47<31:19:07, 6.82s/it]g-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:32,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1316/17840 [2:14:00<30:48:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1316/17840 [2:14:00<30:48:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1316/17840 [2:14:00<30:48:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1316/17840 [2:14:00<30:48:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1317/17840 [2:14:07<30:41:31, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:07,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:07,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:07,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:14:13<30:28:13, 6.64s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:13,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:13,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:13,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:14:20<30:10:48, 6.58s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:14:20<30:10:48, 6.58s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:21,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:21,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:14:26<29:49:23, 6.50s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:14:26<29:49:23, 6.50s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:14:26<29:49:23, 6.50s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:14:26<29:49:23, 6.50s/it]g-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:29,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:29,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:29,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:35,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:35,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5304, 'learning_rate': 9.80997624703088e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:35,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:42,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:42,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3375, 'learning_rate': 9.80938242280285e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:42,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:42,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:42,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1324/17840 [2:14:51<28:56:50, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1324/17840 [2:14:51<28:56:50, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1324/17840 [2:14:51<28:56:50, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1324/17840 [2:14:51<28:56:50, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:14:59<31:55:17, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1326/17840 [2:15:05<30:44:48, 6.70s/it]g-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:05,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:05,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:05,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1327/17840 [2:15:11<29:35:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:10,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1327/17840 [2:15:11<29:35:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:10,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1327/17840 [2:15:11<29:35:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:10,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1327/17840 [2:15:11<29:35:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:10,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [2:15:17<28:47:19, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [2:15:17<28:47:19, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:20,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:20,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5376, 'learning_rate': 9.80581947743468e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:24,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:24,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1330/17840 [2:15:28<27:14:53, 5.94s/it]g-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:28,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:28,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:28,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:16,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:15:34<26:25:03, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:15:34<26:25:03, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:15:34<26:25:03, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:36,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:36,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:40,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:40,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:32,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1333/17840 [2:15:44<24:46:01, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:44,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:44,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1334/17840 [2:15:49<23:35:41, 5.15s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:48,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:48,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:50,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:52,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:52,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:54,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:57,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:00,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:00,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:02,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:02,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:05,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:05,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:06,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:08,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:08,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9825, 'learning_rate': 9.79809976247031e-05, 'epoch': 1.5} +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:14,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:14,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:14,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:18,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:18,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:22,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:22,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:22,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:26,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:26,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:26,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:33,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:33,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4219, 'learning_rate': 9.796318289786224e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:33,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:33,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:33,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:16:44<29:09:46, 6.37s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:16:44<29:09:46, 6.37s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:16:44<29:09:46, 6.37s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:16:44<29:09:46, 6.37s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:16:44<29:09:46, 6.37s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:16:51<30:31:55, 6.66s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:16:51<30:31:55, 6.66s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:54,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:16:58<31:30:50, 6.88s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:16:58<31:30:50, 6.88s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3592, 'learning_rate': 9.794536817102138e-05, 'epoch': 1.51} + 8%|█████▌ | 1348/17840 [2:16:58<31:30:50, 6.88s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:16:58<31:30:50, 6.88s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:16:58<31:30:50, 6.88s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:17:06<32:07:56, 7.01s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:17:06<32:07:56, 7.01s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:08,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:17:15<35:33:41, 7.76s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:17:15<35:33:41, 7.76s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1111, 'learning_rate': 9.79334916864608e-05, 'epoch': 1.51} + 8%|█████▌ | 1350/17840 [2:17:15<35:33:41, 7.76s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:17:15<35:33:41, 7.76s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:17:23<34:50:44, 7.61s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:17:23<34:50:44, 7.61s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2654, 'learning_rate': 9.792755344418053e-05, 'epoch': 1.51} + 8%|█████▌ | 1351/17840 [2:17:23<34:50:44, 7.61s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:17:23<34:50:44, 7.61s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:17:23<34:50:44, 7.61s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:17:30<34:24:26, 7.51s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:30,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:30,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:17:37<33:48:02, 7.38s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:17:37<33:48:02, 7.38s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3113, 'learning_rate': 9.791567695961997e-05, 'epoch': 1.52} + 8%|█████▌ | 1353/17840 [2:17:37<33:48:02, 7.38s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:41,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:41,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2366, 'learning_rate': 9.790973871733967e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:41,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:41,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:51<33:05:45, 7.23s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:51<33:05:45, 7.23s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.344, 'learning_rate': 9.790380047505938e-05, 'epoch': 1.52} + 8%|█████▌ | 1355/17840 [2:17:51<33:05:45, 7.23s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:51<33:05:45, 7.23s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:51<33:05:45, 7.23s/it]g-point operations will not be computed-17 18:56:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:17:58<32:50:42, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:17:58<32:50:42, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:17:58<32:50:42, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1357/17840 [2:18:05<32:30:49, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1357/17840 [2:18:05<32:30:49, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2421, 'learning_rate': 9.789192399049881e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:07,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:18:12<32:14:23, 7.04s/it]g-point operations will not be computed-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:18:12<32:14:23, 7.04s/it]g-point operations will not be computed-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4055, 'learning_rate': 9.788598574821853e-05, 'epoch': 1.52} + 8%|█████▌ | 1358/17840 [2:18:12<32:14:23, 7.04s/it]g-point operations will not be computed-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:18:12<32:14:23, 7.04s/it]g-point operations will not be computed-17 18:58:57,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:18:19<32:01:29, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:18:19<32:01:29, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2082, 'learning_rate': 9.788004750593825e-05, 'epoch': 1.52} + 8%|█████▌ | 1359/17840 [2:18:19<32:01:29, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:18:26<31:43:55, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:18:26<31:43:55, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0587, 'learning_rate': 9.787410926365797e-05, 'epoch': 1.52} + 8%|█████▌ | 1360/17840 [2:18:26<31:43:55, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:29,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:29,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.364, 'learning_rate': 9.786817102137767e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:29,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:29,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1362/17840 [2:18:39<31:34:03, 6.90s/it]g-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1362/17840 [2:18:39<31:34:03, 6.90s/it]g-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:18:46<31:20:45, 6.85s/it]g-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:18:46<31:20:45, 6.85s/it]g-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1704, 'learning_rate': 9.78562945368171e-05, 'epoch': 1.53} + 8%|█████▌ | 1363/17840 [2:18:46<31:20:45, 6.85s/it]g-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1557, 'learning_rate': 9.785035629453682e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.522, 'learning_rate': 9.784441805225654e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:18,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:19:06<30:33:44, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:19:06<30:33:44, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3374, 'learning_rate': 9.783847980997625e-05, 'epoch': 1.53} + 8%|█████▌ | 1366/17840 [2:19:06<30:33:44, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:19:12<30:22:19, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:19:12<30:22:19, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:13,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:13,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:13,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:19:19<30:05:59, 6.58s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:19:19<30:05:59, 6.58s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:21,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:21,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:19:25<29:49:34, 6.52s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:19:25<29:49:34, 6.52s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:27,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1370/17840 [2:19:32<29:37:26, 6.48s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1370/17840 [2:19:32<29:37:26, 6.48s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.956, 'learning_rate': 9.78147268408551e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:33,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1371/17840 [2:19:38<29:33:08, 6.46s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1371/17840 [2:19:38<29:33:08, 6.46s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2859, 'learning_rate': 9.780878859857482e-05, 'epoch': 1.54} + 8%|█████▌ | 1371/17840 [2:19:38<29:33:08, 6.46s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:41,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:41,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1766, 'learning_rate': 9.780285035629454e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:41,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2524, 'learning_rate': 9.779691211401426e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:54,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:54,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1823, 'learning_rate': 9.779097387173397e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:58,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:20:05<31:10:31, 6.82s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:20:05<31:10:31, 6.82s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3626, 'learning_rate': 9.778503562945369e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:06,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1376/17840 [2:20:11<29:48:09, 6.52s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1376/17840 [2:20:11<29:48:09, 6.52s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2324, 'learning_rate': 9.77790973871734e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:12,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:20:16<28:59:11, 6.34s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:20:16<28:59:11, 6.34s/it]g-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0653, 'learning_rate': 9.77731591448931e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:18,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:18,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:00:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:20:22<28:11:11, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:20:22<28:11:11, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:20:22<28:11:11, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:20:22<28:11:11, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1379/17840 [2:20:28<27:27:25, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1379/17840 [2:20:28<27:27:25, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:30,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:30,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1106, 'learning_rate': 9.775534441805227e-05, 'epoch': 1.55} +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:34,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1381/17840 [2:20:39<25:59:38, 5.69s/it]g-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1381/17840 [2:20:39<25:59:38, 5.69s/it]g-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:38,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:38,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:38,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:26,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1382/17840 [2:20:44<25:10:31, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:42,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:44,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:42,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:44,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:42,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1383/17840 [2:20:49<24:20:25, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1383/17840 [2:20:49<24:20:25, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:50,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:50,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:52,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:54,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:54,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:56,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:58,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:58,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:00,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:02,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:02,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:05,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:05,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:06,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:09,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:09,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:10,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:10,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:13,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:13,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:15,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:15,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6673, 'learning_rate': 9.768408551068884e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:19,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:19,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:23,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:23,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2298, 'learning_rate': 9.767814726840856e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:27,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:27,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:31,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:31,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1461, 'learning_rate': 9.767220902612827e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:31,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:31,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:21:41<27:23:24, 6.00s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:21:41<27:23:24, 6.00s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1686, 'learning_rate': 9.766627078384799e-05, 'epoch': 1.56} + 8%|█████▋ | 1395/17840 [2:21:41<27:23:24, 6.00s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:46,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:46,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2302, 'learning_rate': 9.76603325415677e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:46,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:46,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:21:56<30:39:06, 6.71s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:21:56<30:39:06, 6.71s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2132, 'learning_rate': 9.76543942992874e-05, 'epoch': 1.57} + 8%|█████▋ | 1397/17840 [2:21:56<30:39:06, 6.71s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:21:56<30:39:06, 6.71s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:22:03<31:34:57, 6.92s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:22:03<31:34:57, 6.92s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2186, 'learning_rate': 9.764845605700714e-05, 'epoch': 1.57} + 8%|█████▋ | 1398/17840 [2:22:03<31:34:57, 6.92s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:08,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:08,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1376, 'learning_rate': 9.764251781472685e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:08,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:08,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:22:21<36:06:44, 7.91s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:22:21<36:06:44, 7.91s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4021, 'learning_rate': 9.763657957244657e-05, 'epoch': 1.57} + 8%|█████▋ | 1400/17840 [2:22:21<36:06:44, 7.91s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:22:21<36:06:44, 7.91s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1401/17840 [2:22:28<35:24:29, 7.75s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1401/17840 [2:22:28<35:24:29, 7.75s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1678, 'learning_rate': 9.763064133016627e-05, 'epoch': 1.57} + 8%|█████▋ | 1401/17840 [2:22:28<35:24:29, 7.75s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:32,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:32,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7018, 'learning_rate': 9.762470308788599e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:32,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:32,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:42<33:53:39, 7.42s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:42<33:53:39, 7.42s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0055, 'learning_rate': 9.76187648456057e-05, 'epoch': 1.57} + 8%|█████▋ | 1403/17840 [2:22:42<33:53:39, 7.42s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:42<33:53:39, 7.42s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:46,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:46,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:46,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:46,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:46,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:22:56<33:07:47, 7.26s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:22:56<33:07:47, 7.26s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:59,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:59,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:23:03<32:46:58, 7.18s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:23:03<32:46:58, 7.18s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:23:03<32:46:58, 7.18s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:23:03<32:46:58, 7.18s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:23:03<32:46:58, 7.18s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:23:10<32:30:04, 7.12s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:11,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:11,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:11,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:23:17<32:14:26, 7.06s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:23:17<32:14:26, 7.06s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:23:17<32:14:26, 7.06s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0557, 'learning_rate': 9.7583135391924e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:23:31<31:54:01, 6.99s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:23:31<31:54:01, 6.99s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:33,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:33,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:23:38<31:42:19, 6.95s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:23:38<31:42:19, 6.95s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:23:38<31:42:19, 6.95s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:23:38<31:42:19, 6.95s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:23:38<31:42:19, 6.95s/it]g-point operations will not be computed-17 19:01:47,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:23:45<31:29:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:23:45<31:29:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:23:45<31:29:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:23:45<31:29:59, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1413/17840 [2:23:52<31:12:10, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:52,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:52,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:52,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:23:58<31:01:31, 6.80s/it]g-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:23:58<31:01:31, 6.80s/it]g-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:23:58<31:01:31, 6.80s/it]g-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:02,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:02,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1653, 'learning_rate': 9.754750593824229e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:02,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:02,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:02,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:04:43,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:24:12<30:44:02, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:24:12<30:44:02, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:24:12<30:44:02, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:24:12<30:44:02, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1417/17840 [2:24:18<30:33:12, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1417/17840 [2:24:18<30:33:12, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:20,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:20,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:24:25<30:19:11, 6.65s/it]g-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:24:25<30:19:11, 6.65s/it]g-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:24:25<30:19:11, 6.65s/it]g-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:28,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:28,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.267, 'learning_rate': 9.752375296912114e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:28,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:35,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:35,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5154, 'learning_rate': 9.751781472684086e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:35,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:35,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:35,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:10,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:24:44<29:42:40, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:43,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:24:44<29:42:40, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:43,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:24:44<29:42:40, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:43,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:24:44<29:42:40, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:43,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:24:50<29:24:31, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:24:50<29:24:31, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:24:50<29:24:31, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:24:50<29:24:31, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:24:57<29:11:19, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:57,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:57,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:57,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:25:03<28:58:14, 6.35s/it]g-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:25:11<31:38:40, 6.94s/it]g-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:25:11<31:38:40, 6.94s/it]g-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:11,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:11,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:11,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:25:17<30:33:47, 6.70s/it]g-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:17,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:17,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:17,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:25:23<29:27:08, 6.46s/it]g-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:23,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:23,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:23,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:25:29<28:32:25, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:25:29<28:32:25, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:32,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:32,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3202, 'learning_rate': 9.74643705463183e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:36,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:25:40<27:05:02, 5.94s/it]g-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:25:40<27:05:02, 5.94s/it]g-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:40,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:40,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:40,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:28,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1431/17840 [2:25:46<26:16:19, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1431/17840 [2:25:46<26:16:19, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:48,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:48,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4099, 'learning_rate': 9.744655581947744e-05, 'epoch': 1.61} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:52,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:52,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1433/17840 [2:25:56<24:41:19, 5.42s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:55,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:58,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:58,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:00,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:02,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:02,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:04,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:06,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:06,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:08,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:10,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:10,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:11,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:11,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:13,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:16,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:16,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:18,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:18,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:20,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:20,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:22,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:22,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:23,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:23,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:27,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:31,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:31,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0598, 'learning_rate': 9.73812351543943e-05, 'epoch': 1.62} +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:34,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:34,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:38,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:38,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3116, 'learning_rate': 9.737529691211402e-05, 'epoch': 1.62} +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:38,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:38,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:26:49<26:56:43, 5.92s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:26:49<26:56:43, 5.92s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2834, 'learning_rate': 9.736935866983374e-05, 'epoch': 1.62} +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:51,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:26:56<28:55:52, 6.35s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:26:56<28:55:52, 6.35s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.067, 'learning_rate': 9.736342042755346e-05, 'epoch': 1.62} + 8%|█████▉ | 1446/17840 [2:26:56<28:55:52, 6.35s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:26:56<28:55:52, 6.35s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:27:04<30:20:22, 6.66s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:27:04<30:20:22, 6.66s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0764, 'learning_rate': 9.735748218527316e-05, 'epoch': 1.62} + 8%|█████▉ | 1447/17840 [2:27:04<30:20:22, 6.66s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:27:04<30:20:22, 6.66s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:27:04<30:20:22, 6.66s/it]g-point operations will not be computed-17 19:06:44,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:27:11<31:12:13, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:27:11<31:12:13, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:27:11<31:12:13, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:27:11<31:12:13, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:27:18<31:42:53, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:27:18<31:42:53, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:27:18<31:42:53, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:27:18<31:42:53, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:27:18<31:42:53, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:27:28<35:13:50, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:28,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:28,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:28,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:27:35<34:30:42, 7.58s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:27:35<34:30:42, 7.58s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:27:35<34:30:42, 7.58s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:27:35<34:30:42, 7.58s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:27:35<34:30:42, 7.58s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:27:42<33:54:21, 7.45s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:42,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:42,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:42,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:49<33:32:17, 7.37s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:49<33:32:17, 7.37s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:49<33:32:17, 7.37s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:49<33:32:17, 7.37s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:49<33:32:17, 7.37s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1454/17840 [2:27:56<33:12:45, 7.30s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:57,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:57,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:57,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:28:03<32:49:22, 7.21s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:28:03<32:49:22, 7.21s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:28:03<32:49:22, 7.21s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:07,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:07,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1705, 'learning_rate': 9.73040380047506e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:07,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:07,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:07,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:28:17<32:09:33, 7.07s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:28:17<32:09:33, 7.07s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:28:17<32:09:33, 7.07s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:21,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:21,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.017, 'learning_rate': 9.729216152019003e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:21,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:21,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:21,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:28:31<31:55:27, 7.02s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:28:31<31:55:27, 7.02s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:33,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:33,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:28:38<31:43:20, 6.97s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:28:38<31:43:20, 6.97s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:28:38<31:43:20, 6.97s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:42,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:42,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9441, 'learning_rate': 9.727434679334917e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:42,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:42,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:42,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:28:51<31:15:56, 6.87s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:28:51<31:15:56, 6.87s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:53,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:53,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:28:58<30:58:04, 6.81s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:28:58<30:58:04, 6.81s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:00,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:29:05<30:49:35, 6.78s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:29:05<30:49:35, 6.78s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8304, 'learning_rate': 9.725653206650832e-05, 'epoch': 1.64} + 8%|█████▉ | 1464/17840 [2:29:05<30:49:35, 6.78s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:08,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:08,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3866, 'learning_rate': 9.725059382422804e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:08,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:08,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:08,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:29:18<30:18:10, 6.66s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:18,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:18,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:18,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:29:24<30:00:16, 6.60s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:25,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:25,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:25,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:29:31<29:49:27, 6.56s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:29:31<29:49:27, 6.56s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:29:31<29:49:27, 6.56s/it]g-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:34,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:34,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1538, 'learning_rate': 9.722684085510689e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:34,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:41,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:41,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.985, 'learning_rate': 9.72209026128266e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:41,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:47,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:47,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1867, 'learning_rate': 9.721496437054632e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:47,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:53,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:53,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7596, 'learning_rate': 9.720902612826604e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:53,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9977, 'learning_rate': 9.720308788598576e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:08:10,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:30:09<28:32:42, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:07,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:30:09<28:32:42, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:07,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:30:09<28:32:42, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:07,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:30:09<28:32:42, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:07,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:30:17<31:13:43, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:30:17<31:13:43, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:20,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:20,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2788, 'learning_rate': 9.718527315914489e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:20,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:25,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:25,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3532, 'learning_rate': 9.717933491686461e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:30,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1478/17840 [2:30:34<27:48:01, 6.12s/it]g-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1478/17840 [2:30:34<27:48:01, 6.12s/it]g-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:34,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:34,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:34,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:15,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:30:40<27:00:33, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:30:40<27:00:33, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:42,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:42,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1322, 'learning_rate': 9.716152019002376e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:46,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1481/17840 [2:30:50<25:38:47, 5.64s/it]g-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1481/17840 [2:30:50<25:38:47, 5.64s/it]g-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:50,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:50,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:50,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1482/17840 [2:30:55<24:50:10, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:54,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:56,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:54,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1483/17840 [2:31:00<24:00:06, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1483/17840 [2:31:00<24:00:06, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0666, 'learning_rate': 9.71437054631829e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:02,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:02,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:04,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:06,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:06,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:12,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:14,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:14,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:16,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:17,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:17,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:21,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:21,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:22,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:24,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:24,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:26,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:26,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:28,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:28,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.135, 'learning_rate': 9.709026128266034e-05, 'epoch': 1.67} +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:32,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:32,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:35,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:35,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.205, 'learning_rate': 9.708432304038006e-05, 'epoch': 1.67} +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:39,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:39,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:39,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:31:46<23:57:59, 5.28s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:47,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:47,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:31:54<27:00:16, 5.95s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:31:54<27:00:16, 5.95s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3499, 'learning_rate': 9.707244655581948e-05, 'epoch': 1.68} + 8%|██████ | 1495/17840 [2:31:54<27:00:16, 5.95s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:31:54<27:00:16, 5.95s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:32:01<28:51:22, 6.36s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:32:01<28:51:22, 6.36s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1733, 'learning_rate': 9.706650831353919e-05, 'epoch': 1.68} + 8%|██████ | 1496/17840 [2:32:01<28:51:22, 6.36s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:05,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:05,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2554, 'learning_rate': 9.706057007125891e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:05,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:05,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:32:16<31:04:06, 6.84s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:32:16<31:04:06, 6.84s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2014, 'learning_rate': 9.705463182897863e-05, 'epoch': 1.68} + 8%|██████▏ | 1498/17840 [2:32:16<31:04:06, 6.84s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:32:16<31:04:06, 6.84s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:32:16<31:04:06, 6.84s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:32:23<31:40:41, 6.98s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:23,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:23,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:32:33<35:24:01, 7.80s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:32:33<35:24:01, 7.80s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1126, 'learning_rate': 9.704275534441806e-05, 'epoch': 1.68} + 8%|██████▏ | 1500/17840 [2:32:33<35:24:01, 7.80s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:32:33<35:24:01, 7.80s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1501/17840 [2:32:40<34:43:51, 7.65s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1501/17840 [2:32:40<34:43:51, 7.65s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4676, 'learning_rate': 9.703681710213777e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:42,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1502/17840 [2:32:47<33:52:08, 7.46s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1502/17840 [2:32:47<33:52:08, 7.46s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3524, 'learning_rate': 9.703087885985749e-05, 'epoch': 1.68} + 8%|██████▏ | 1502/17840 [2:32:47<33:52:08, 7.46s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1502/17840 [2:32:47<33:52:08, 7.46s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1503/17840 [2:32:54<33:14:26, 7.32s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1503/17840 [2:32:54<33:14:26, 7.32s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2967, 'learning_rate': 9.702494061757719e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:33:01<32:49:45, 7.23s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:33:01<32:49:45, 7.23s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:33:01<32:49:45, 7.23s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:33:01<32:49:45, 7.23s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:33:01<32:49:45, 7.23s/it]g-point operations will not be computed-17 19:11:58,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:33:08<32:27:10, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:33:08<32:27:10, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:33:08<32:27:10, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:33:08<32:27:10, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:33:15<32:10:18, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:33:15<32:10:18, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:33:15<32:10:18, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:33:15<32:10:18, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:19,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:19,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:19,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:19,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:19,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1508/17840 [2:33:29<31:43:45, 6.99s/it]g-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:29,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:29,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:29,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:33:35<31:30:19, 6.95s/it]g-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:33:35<31:30:19, 6.95s/it]g-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:33:35<31:30:19, 6.95s/it]g-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:39,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:39,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0551, 'learning_rate': 9.698337292161521e-05, 'epoch': 1.69} +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:39,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:39,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:39,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:07,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:49<31:07:30, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:49<31:07:30, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:49<31:07:30, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:49<31:07:30, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1512/17840 [2:33:56<31:02:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1512/17840 [2:33:56<31:02:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:58,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1513/17840 [2:34:03<30:51:59, 6.81s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1513/17840 [2:34:03<30:51:59, 6.81s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1537, 'learning_rate': 9.696555819477436e-05, 'epoch': 1.7} + 8%|██████▏ | 1513/17840 [2:34:03<30:51:59, 6.81s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:06,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:06,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6683, 'learning_rate': 9.695961995249406e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:06,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:06,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:06,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1515/17840 [2:34:16<30:42:06, 6.77s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:16,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:16,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1516/17840 [2:34:23<30:22:28, 6.70s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1516/17840 [2:34:23<30:22:28, 6.70s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.272, 'learning_rate': 9.694774346793349e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:24,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1517/17840 [2:34:29<29:58:30, 6.61s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1517/17840 [2:34:29<29:58:30, 6.61s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1667, 'learning_rate': 9.694180522565321e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:31,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1518/17840 [2:34:35<29:45:46, 6.56s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1518/17840 [2:34:35<29:45:46, 6.56s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3599, 'learning_rate': 9.693586698337293e-05, 'epoch': 1.7} + 9%|██████▏ | 1518/17840 [2:34:35<29:45:46, 6.56s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:39,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:39,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0558, 'learning_rate': 9.692992874109265e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:39,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:45,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:45,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1359, 'learning_rate': 9.692399049881236e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:45,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:45,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:45,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1521/17840 [2:34:54<29:08:47, 6.43s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:55,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:55,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:55,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1522/17840 [2:35:01<28:59:08, 6.39s/it]g-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:01,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:01,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:01,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1523/17840 [2:35:07<28:41:32, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1523/17840 [2:35:07<28:41:32, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1523/17840 [2:35:07<28:41:32, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1523/17840 [2:35:07<28:41:32, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1524/17840 [2:35:13<28:28:26, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:13,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:13,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1525/17840 [2:35:22<31:20:28, 6.92s/it]g-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1525/17840 [2:35:22<31:20:28, 6.92s/it]g-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:22,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:22,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:22,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1526/17840 [2:35:27<29:58:16, 6.61s/it]g-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:27,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:27,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:27,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1527/17840 [2:35:33<28:59:39, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1527/17840 [2:35:33<28:59:39, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:36,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:36,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1207, 'learning_rate': 9.687648456057008e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:36,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:42,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:42,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0269, 'learning_rate': 9.687054631828979e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:46,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1530/17840 [2:35:50<26:49:08, 5.92s/it]g-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1530/17840 [2:35:50<26:49:08, 5.92s/it]g-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:50,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:50,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:50,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:32,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1531/17840 [2:35:56<26:00:12, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:54,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1531/17840 [2:35:56<26:00:12, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:54,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:54,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:54,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2594, 'learning_rate': 9.685273159144893e-05, 'epoch': 1.72} +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:54,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:54,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1533/17840 [2:36:06<24:23:10, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:06,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1534/17840 [2:36:11<23:28:47, 5.18s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1534/17840 [2:36:11<23:28:47, 5.18s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:10,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:12,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:12,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:14,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:16,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:16,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:18,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:20,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:20,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:21,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:21,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:24,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:26,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:26,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:29,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:29,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:30,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:30,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:32,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:32,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:33,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:37,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:37,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:37,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:41,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:41,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:45,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:45,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:45,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:49,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1545/17840 [2:36:59<27:10:44, 6.00s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1545/17840 [2:36:59<27:10:44, 6.00s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1545/17840 [2:36:59<27:10:44, 6.00s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:04,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:04,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2873, 'learning_rate': 9.676959619952495e-05, 'epoch': 1.73} +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:04,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:04,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:04,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:37:14<30:32:47, 6.75s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:37:14<30:32:47, 6.75s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:37:14<30:32:47, 6.75s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:37:14<30:32:47, 6.75s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:37:14<30:32:47, 6.75s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1548/17840 [2:37:22<31:18:18, 6.92s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:22,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:22,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:37:29<31:48:56, 7.03s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:37:29<31:48:56, 7.03s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4483, 'learning_rate': 9.675178147268409e-05, 'epoch': 1.74} + 9%|██████▎ | 1549/17840 [2:37:29<31:48:56, 7.03s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:37:29<31:48:56, 7.03s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:37:29<31:48:56, 7.03s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:37:38<35:11:32, 7.78s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:37:38<35:11:32, 7.78s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:37:38<35:11:32, 7.78s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:37:38<35:11:32, 7.78s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:37:38<35:11:32, 7.78s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1551/17840 [2:37:46<34:36:07, 7.65s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:46,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:46,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:37:53<34:03:45, 7.53s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:37:53<34:03:45, 7.53s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6695, 'learning_rate': 9.673396674584323e-05, 'epoch': 1.74} + 9%|██████▎ | 1552/17840 [2:37:53<34:03:45, 7.53s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:37:53<34:03:45, 7.53s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:37:53<34:03:45, 7.53s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1553/17840 [2:38:00<33:23:30, 7.38s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:00,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:00,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:00,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1554/17840 [2:38:07<32:51:17, 7.26s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1554/17840 [2:38:07<32:51:17, 7.26s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1554/17840 [2:38:07<32:51:17, 7.26s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1911, 'learning_rate': 9.671615201900238e-05, 'epoch': 1.74} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1556/17840 [2:38:21<32:20:15, 7.15s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1556/17840 [2:38:21<32:20:15, 7.15s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1556/17840 [2:38:21<32:20:15, 7.15s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:25,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:25,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4345, 'learning_rate': 9.670427553444181e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:25,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:25,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:25,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1558/17840 [2:38:35<31:51:14, 7.04s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:35,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:35,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1559/17840 [2:38:42<31:35:36, 6.99s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1559/17840 [2:38:42<31:35:36, 6.99s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0883, 'learning_rate': 9.669239904988125e-05, 'epoch': 1.75} + 9%|██████▍ | 1559/17840 [2:38:42<31:35:36, 6.99s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:45,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:45,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4396, 'learning_rate': 9.668646080760096e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:45,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:45,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1561/17840 [2:38:55<31:12:57, 6.90s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1561/17840 [2:38:55<31:12:57, 6.90s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:56,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:56,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1562/17840 [2:39:02<31:00:01, 6.86s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1562/17840 [2:39:02<31:00:01, 6.86s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5551, 'learning_rate': 9.667458432304038e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:04,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:39:09<30:53:23, 6.83s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:39:09<30:53:23, 6.83s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.59, 'learning_rate': 9.666864608076009e-05, 'epoch': 1.75} + 9%|██████▍ | 1563/17840 [2:39:09<30:53:23, 6.83s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:39:09<30:53:23, 6.83s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:39:09<30:53:23, 6.83s/it]g-point operations will not be computed-17 19:17:04,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:39:16<30:44:33, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:39:16<30:44:33, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:39:16<30:44:33, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1565/17840 [2:39:22<30:25:52, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1565/17840 [2:39:22<30:25:52, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:22,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:22,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1566/17840 [2:39:29<30:12:12, 6.68s/it]g-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1566/17840 [2:39:29<30:12:12, 6.68s/it]g-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3777, 'learning_rate': 9.665083135391925e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:31,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1567/17840 [2:39:35<30:00:32, 6.64s/it]g-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1567/17840 [2:39:35<30:00:32, 6.64s/it]g-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4091, 'learning_rate': 9.664489311163896e-05, 'epoch': 1.76} + 9%|██████▍ | 1567/17840 [2:39:35<30:00:32, 6.64s/it]g-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:39,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:39,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3629, 'learning_rate': 9.663895486935868e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:39,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:45,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:45,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:45,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3297, 'learning_rate': 9.663301662707838e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:45,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:45,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:14,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1570/17840 [2:39:55<29:15:15, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:53,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1570/17840 [2:39:55<29:15:15, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:53,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1570/17840 [2:39:55<29:15:15, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:53,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1570/17840 [2:39:55<29:15:15, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:53,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1571/17840 [2:40:01<29:02:25, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:59,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1571/17840 [2:40:01<29:02:25, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:59,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1571/17840 [2:40:01<29:02:25, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:59,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1571/17840 [2:40:01<29:02:25, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:59,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1572/17840 [2:40:07<28:54:30, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:06,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1572/17840 [2:40:07<28:54:30, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:06,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1572/17840 [2:40:07<28:54:30, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:06,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1572/17840 [2:40:07<28:54:30, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:06,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1573/17840 [2:40:13<28:37:56, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:12,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1573/17840 [2:40:13<28:37:56, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:12,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1573/17840 [2:40:13<28:37:56, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:12,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1573/17840 [2:40:13<28:37:56, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:12,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1574/17840 [2:40:20<28:23:05, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1574/17840 [2:40:20<28:23:05, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1574/17840 [2:40:20<28:23:05, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1574/17840 [2:40:20<28:23:05, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1575/17840 [2:40:28<31:10:49, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:28,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:28,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:28,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1576/17840 [2:40:34<29:57:53, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1576/17840 [2:40:34<29:57:53, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:37,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:37,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.289, 'learning_rate': 9.65855106888361e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:37,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:37,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:42,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:42,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:47,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:47,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1579/17840 [2:40:51<27:11:03, 6.02s/it]g-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1579/17840 [2:40:51<27:11:03, 6.02s/it]g-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:52,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:52,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1580/17840 [2:40:57<26:23:40, 5.84s/it]g-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:56,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:56,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:59,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:59,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:03,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:03,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1582/17840 [2:41:07<24:55:08, 5.52s/it]g-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:06,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:09,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:09,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:11,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:13,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:13,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2484, 'learning_rate': 9.654394299287411e-05, 'epoch': 1.78} +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:16,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:16,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:32,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1585/17840 [2:41:21<21:47:54, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:19,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:21,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:19,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:21,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:19,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1586/17840 [2:41:25<20:36:10, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:22,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1587/17840 [2:41:28<19:18:03, 4.28s/it]g-point operations will not be computed-17 19:22:22,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1587/17840 [2:41:28<19:18:03, 4.28s/it]g-point operations will not be computed-17 19:22:22,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1587/17840 [2:41:28<19:18:03, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:26,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1587/17840 [2:41:28<19:18:03, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:26,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1588/17840 [2:41:31<17:54:27, 3.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1589/17840 [2:41:34<16:30:49, 3.66s/it]g-point operations will not be computed-17 19:22:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1589/17840 [2:41:34<16:30:49, 3.66s/it]g-point operations will not be computed-17 19:22:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:33,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:32,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:33,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:32,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1590/17840 [2:41:37<15:12:40, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:35,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1590/17840 [2:41:37<15:12:40, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:35,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1591/17840 [2:41:39<13:58:11, 3.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:37,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1591/17840 [2:41:39<13:58:11, 3.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:37,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:42<12:39:43, 2.81s/it]g-point operations will not be computed-17 19:22:37,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:42<12:39:43, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:42<12:39:43, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:44,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:44,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:49<19:25:51, 4.31s/it]g-point operations will not be computed-17 19:22:41,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:49<19:25:51, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:49<19:25:51, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:52,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:52,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1594/17840 [2:41:57<23:50:48, 5.28s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:58,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:58,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1595/17840 [2:42:05<26:54:20, 5.96s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1595/17840 [2:42:05<26:54:20, 5.96s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1514, 'learning_rate': 9.647862232779098e-05, 'epoch': 1.79} + 9%|██████▌ | 1595/17840 [2:42:05<26:54:20, 5.96s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1595/17840 [2:42:05<26:54:20, 5.96s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1595/17840 [2:42:05<26:54:20, 5.96s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:42:12<28:45:37, 6.37s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:42:12<28:45:37, 6.37s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:14,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:42:19<30:05:56, 6.67s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:42:19<30:05:56, 6.67s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1506, 'learning_rate': 9.64667458432304e-05, 'epoch': 1.79} + 9%|██████▌ | 1597/17840 [2:42:19<30:05:56, 6.67s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:42:19<30:05:56, 6.67s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:42:26<30:55:16, 6.85s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:42:26<30:55:16, 6.85s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.187, 'learning_rate': 9.646080760095013e-05, 'epoch': 1.79} + 9%|██████▌ | 1598/17840 [2:42:26<30:55:16, 6.85s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:42:26<30:55:16, 6.85s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:42:26<30:55:16, 6.85s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1599/17840 [2:42:34<31:28:42, 6.98s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1599/17840 [2:42:34<31:28:42, 6.98s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:36,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:43<35:01:08, 7.76s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:43<35:01:08, 7.76s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5896, 'learning_rate': 9.644893111638955e-05, 'epoch': 1.79} + 9%|██████▌ | 1600/17840 [2:42:43<35:01:08, 7.76s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:43<35:01:08, 7.76s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:43<35:01:08, 7.76s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:42:51<34:26:34, 7.64s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:42:51<34:26:34, 7.64s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:42:51<34:26:34, 7.64s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:42:51<34:26:34, 7.64s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:42:51<34:26:34, 7.64s/it]g-point operations will not be computed-17 19:22:48,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1602/17840 [2:42:58<33:55:15, 7.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1602/17840 [2:42:58<33:55:15, 7.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1602/17840 [2:42:58<33:55:15, 7.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1603/17840 [2:43:05<33:22:21, 7.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1603/17840 [2:43:05<33:22:21, 7.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4424, 'learning_rate': 9.64311163895487e-05, 'epoch': 1.8} + 9%|██████▌ | 1603/17840 [2:43:05<33:22:21, 7.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:09,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:09,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0827, 'learning_rate': 9.642517814726841e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:09,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:09,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1605/17840 [2:43:19<32:24:18, 7.19s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1605/17840 [2:43:19<32:24:18, 7.19s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4371, 'learning_rate': 9.641923990498813e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:21,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1606/17840 [2:43:26<32:14:07, 7.15s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1606/17840 [2:43:26<32:14:07, 7.15s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3504, 'learning_rate': 9.641330166270785e-05, 'epoch': 1.8} + 9%|██████▌ | 1606/17840 [2:43:26<32:14:07, 7.15s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1606/17840 [2:43:26<32:14:07, 7.15s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1606/17840 [2:43:26<32:14:07, 7.15s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1607/17840 [2:43:33<31:51:45, 7.07s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:33,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:33,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1608/17840 [2:43:40<31:36:57, 7.01s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1608/17840 [2:43:40<31:36:57, 7.01s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2136, 'learning_rate': 9.640142517814727e-05, 'epoch': 1.8} + 9%|██████▌ | 1608/17840 [2:43:40<31:36:57, 7.01s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.173, 'learning_rate': 9.639548693586698e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1610/17840 [2:43:53<31:04:51, 6.89s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1610/17840 [2:43:53<31:04:51, 6.89s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:54,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:54,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:54,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1611/17840 [2:44:00<30:54:06, 6.85s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1611/17840 [2:44:00<30:54:06, 6.85s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1611/17840 [2:44:00<30:54:06, 6.85s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:04,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:04,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.167, 'learning_rate': 9.637767220902614e-05, 'epoch': 1.81} +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:04,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:04,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:44:14<30:42:14, 6.81s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:44:14<30:42:14, 6.81s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:14,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:14,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:14,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:44:20<30:28:30, 6.76s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:44:20<30:28:30, 6.76s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:22,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:22,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1615/17840 [2:44:27<30:14:06, 6.71s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1615/17840 [2:44:27<30:14:06, 6.71s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1615/17840 [2:44:27<30:14:06, 6.71s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1615/17840 [2:44:27<30:14:06, 6.71s/it]g-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:30,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:30,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:30,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:37,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:37,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1879, 'learning_rate': 9.63479809976247e-05, 'epoch': 1.81} +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:37,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:37,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:37,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:23:57,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1618/17840 [2:44:46<29:22:11, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1618/17840 [2:44:46<29:22:11, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1618/17840 [2:44:46<29:22:11, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1618/17840 [2:44:46<29:22:11, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1619/17840 [2:44:53<29:17:52, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:53,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:53,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:53,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1620/17840 [2:44:59<29:12:03, 6.48s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:59,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:59,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:59,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1621/17840 [2:45:06<29:04:14, 6.45s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1621/17840 [2:45:06<29:04:14, 6.45s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:07,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:07,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:45:12<28:50:11, 6.40s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:45:12<28:50:11, 6.40s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:45:12<28:50:11, 6.40s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:45:12<28:50:11, 6.40s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:15,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:15,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:20,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:20,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1624/17840 [2:45:24<28:19:45, 6.29s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1624/17840 [2:45:24<28:19:45, 6.29s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:26,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:45:33<31:40:05, 7.03s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:45:33<31:40:05, 7.03s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3028, 'learning_rate': 9.630047505938243e-05, 'epoch': 1.82} + 9%|██████▋ | 1625/17840 [2:45:33<31:40:05, 7.03s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:36,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:36,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0353, 'learning_rate': 9.629453681710215e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:36,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:42,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:42,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1346, 'learning_rate': 9.628859857482185e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:42,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:42,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:48,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:48,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:52,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:52,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1629/17840 [2:45:56<27:27:07, 6.10s/it]g-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:56,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:56,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:56,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:45,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1630/17840 [2:46:02<26:42:14, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1630/17840 [2:46:02<26:42:14, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9675, 'learning_rate': 9.626484560570072e-05, 'epoch': 1.83} +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:08,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:08,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1632/17840 [2:46:13<25:22:06, 5.63s/it]g-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:12,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:15,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:15,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4358, 'learning_rate': 9.625296912114015e-05, 'epoch': 1.83} +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:18,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:18,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:00,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1634/17840 [2:46:22<23:33:51, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:20,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:23,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:20,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:23,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:20,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1635/17840 [2:46:27<22:18:22, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:25,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:27,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:25,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:27,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:25,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1636/17840 [2:46:31<21:08:11, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:29,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:31,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:29,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:31,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:29,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1637/17840 [2:46:35<19:51:00, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:32,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:34,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:32,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:34,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:32,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1638/17840 [2:46:38<18:23:14, 4.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:36,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1638/17840 [2:46:38<18:23:14, 4.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:36,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███��██▋ | 1639/17840 [2:46:41<16:56:07, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:39,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1640/17840 [2:46:44<15:32:30, 3.45s/it]g-point operations will not be computed-17 19:27:39,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1640/17840 [2:46:44<15:32:30, 3.45s/it]g-point operations will not be computed-17 19:27:39,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:42,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:41,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:42,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:41,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:45,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:44,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:45,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:44,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1642/17840 [2:46:48<12:42:37, 2.82s/it]g-point operations will not be computed-17 19:27:44,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1642/17840 [2:46:48<12:42:37, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:47,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:51,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:47,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:56<19:20:13, 4.30s/it]g-point operations will not be computed-17 19:27:47,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:56<19:20:13, 4.30s/it]g-point operations will not be computed-17 19:27:47,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:56<19:20:13, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:56<19:20:13, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:58,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:58,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:47:03<23:41:07, 5.26s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:47:03<23:41:07, 5.26s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:47:03<23:41:07, 5.26s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:47:03<23:41:07, 5.26s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:47:03<23:41:07, 5.26s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1645/17840 [2:47:11<26:33:44, 5.90s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:11,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:11,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:47:18<28:33:48, 6.35s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:47:18<28:33:48, 6.35s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3679, 'learning_rate': 9.617577197149645e-05, 'epoch': 1.85} + 9%|██████▋ | 1646/17840 [2:47:18<28:33:48, 6.35s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:47:18<28:33:48, 6.35s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:47:18<28:33:48, 6.35s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:47:25<29:44:27, 6.61s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:47:25<29:44:27, 6.61s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:47:25<29:44:27, 6.61s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3239, 'learning_rate': 9.616389548693587e-05, 'epoch': 1.85} +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1649/17840 [2:47:40<31:06:21, 6.92s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1649/17840 [2:47:40<31:06:21, 6.92s/it]g-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:42,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:42,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:47:50<34:50:31, 7.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:47:50<34:50:31, 7.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:47:50<34:50:31, 7.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:47:57<34:11:39, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:47:57<34:11:39, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9051, 'learning_rate': 9.614608076009502e-05, 'epoch': 1.85} + 9%|██████▊ | 1651/17840 [2:47:57<34:11:39, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:47:57<34:11:39, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:47:57<34:11:39, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:28:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1652/17840 [2:48:04<33:30:16, 7.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1652/17840 [2:48:04<33:30:16, 7.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1652/17840 [2:48:04<33:30:16, 7.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1653/17840 [2:48:11<33:00:22, 7.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1653/17840 [2:48:11<33:00:22, 7.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9703, 'learning_rate': 9.613420427553445e-05, 'epoch': 1.85} + 9%|██████▊ | 1653/17840 [2:48:11<33:00:22, 7.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1653/17840 [2:48:11<33:00:22, 7.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1653/17840 [2:48:11<33:00:22, 7.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:03,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:48:18<32:30:08, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:48:18<32:30:08, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:48:18<32:30:08, 7.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:48:25<32:12:31, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:48:25<32:12:31, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2055, 'learning_rate': 9.612232779097387e-05, 'epoch': 1.86} + 9%|██████▊ | 1655/17840 [2:48:25<32:12:31, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:48:25<32:12:31, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:48:25<32:12:31, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1656/17840 [2:48:32<31:53:59, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1656/17840 [2:48:32<31:53:59, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1656/17840 [2:48:32<31:53:59, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:48:39<31:36:45, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:48:39<31:36:45, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4892, 'learning_rate': 9.61104513064133e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:41,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:48:46<31:21:50, 6.98s/it]g-point operations will not be computed-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:48:46<31:21:50, 6.98s/it]g-point operations will not be computed-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2934, 'learning_rate': 9.610451306413302e-05, 'epoch': 1.86} + 9%|██████▊ | 1658/17840 [2:48:46<31:21:50, 6.98s/it]g-point operations will not be computed-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:48:46<31:21:50, 6.98s/it]g-point operations will not be computed-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:48:46<31:21:50, 6.98s/it]g-point operations will not be computed-17 19:29:31,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1659/17840 [2:48:53<31:21:25, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1659/17840 [2:48:53<31:21:25, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1659/17840 [2:48:53<31:21:25, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1660/17840 [2:48:59<31:10:11, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1660/17840 [2:48:59<31:10:11, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1353, 'learning_rate': 9.609263657957245e-05, 'epoch': 1.86} + 9%|██████▊ | 1660/17840 [2:48:59<31:10:11, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:03,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:03,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1677, 'learning_rate': 9.608669833729217e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:03,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:03,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:03,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:51,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1662/17840 [2:49:13<30:46:10, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1662/17840 [2:49:13<30:46:10, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1662/17840 [2:49:13<30:46:10, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:49:20<30:36:16, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:49:20<30:36:16, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.209, 'learning_rate': 9.60748218527316e-05, 'epoch': 1.86} + 9%|██████▊ | 1663/17840 [2:49:20<30:36:16, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2678, 'learning_rate': 9.606888361045132e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:12,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:49:33<30:19:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:49:33<30:19:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:49:33<30:19:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:49:33<30:19:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1666/17840 [2:49:40<30:03:51, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:40,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:40,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:49:46<29:54:26, 6.66s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:49:46<29:54:26, 6.66s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:46,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:46,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:49:53<29:34:55, 6.59s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:49:53<29:34:55, 6.59s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3621, 'learning_rate': 9.604513064133017e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:54,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1669/17840 [2:49:59<29:27:36, 6.56s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1669/17840 [2:49:59<29:27:36, 6.56s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3748, 'learning_rate': 9.603919239904988e-05, 'epoch': 1.87} + 9%|██████▊ | 1669/17840 [2:49:59<29:27:36, 6.56s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1669/17840 [2:49:59<29:27:36, 6.56s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:09,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:09,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9964, 'learning_rate': 9.602731591448932e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:09,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0363, 'learning_rate': 9.602137767220904e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:15,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:21,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:21,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8083, 'learning_rate': 9.601543942992875e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:21,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4265, 'learning_rate': 9.600950118764847e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1596, 'learning_rate': 9.600356294536817e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:27,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:42,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:42,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1778, 'learning_rate': 9.59976247030879e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:42,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:47,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:47,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1514, 'learning_rate': 9.59916864608076e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:52,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:52,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1678/17840 [2:50:56<27:42:39, 6.17s/it]g-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:56,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:56,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:56,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:32,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1679/17840 [2:51:02<26:56:24, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1679/17840 [2:51:02<26:56:24, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:04,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:04,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0615, 'learning_rate': 9.597387173396675e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:08,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1681/17840 [2:51:13<25:30:07, 5.68s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1681/17840 [2:51:13<25:30:07, 5.68s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:12,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:15,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:15,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9569, 'learning_rate': 9.596199524940617e-05, 'epoch': 1.89} +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:18,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:18,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1683/17840 [2:51:22<23:38:48, 5.27s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:24,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:24,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:26,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:28,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:28,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:30,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:32,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:32,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:34,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:34,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:36,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:38,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:38,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:39,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:42,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:42,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:44,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:44,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:46,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:46,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:48,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:48,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:49,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:49,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:53,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:53,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:53,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:57,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:01,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:01,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:05,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:05,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3706, 'learning_rate': 9.589073634204276e-05, 'epoch': 1.9} +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:05,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:05,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:05,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:52:15<26:46:44, 5.97s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:52:15<26:46:44, 5.97s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:52:15<26:46:44, 5.97s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:20,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:20,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2107, 'learning_rate': 9.587885985748219e-05, 'epoch': 1.9} +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:20,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:20,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:52:30<29:48:58, 6.65s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:52:30<29:48:58, 6.65s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1901, 'learning_rate': 9.58729216152019e-05, 'epoch': 1.9} + 10%|██████▉ | 1697/17840 [2:52:30<29:48:58, 6.65s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:52:30<29:48:58, 6.65s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:52:30<29:48:58, 6.65s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:52:37<30:44:10, 6.85s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:52:37<30:44:10, 6.85s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:52:37<30:44:10, 6.85s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:42,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:42,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1769, 'learning_rate': 9.586104513064134e-05, 'epoch': 1.9} +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:42,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:42,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:52:54<34:46:06, 7.76s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:52:54<34:46:06, 7.76s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2541, 'learning_rate': 9.585510688836105e-05, 'epoch': 1.91} + 10%|██████▉ | 1700/17840 [2:52:54<34:46:06, 7.76s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:52:54<34:46:06, 7.76s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:52:54<34:46:06, 7.76s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1701/17840 [2:53:01<34:03:10, 7.60s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:02,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:02,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:53:09<33:33:17, 7.49s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:53:09<33:33:17, 7.49s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1792, 'learning_rate': 9.584323040380047e-05, 'epoch': 1.91} + 10%|██████▉ | 1702/17840 [2:53:09<33:33:17, 7.49s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:53:09<33:33:17, 7.49s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:53:09<33:33:17, 7.49s/it]g-point operations will not be computed-17 19:32:00,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1703/17840 [2:53:16<33:07:57, 7.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1703/17840 [2:53:16<33:07:57, 7.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1703/17840 [2:53:16<33:07:57, 7.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:53:23<32:38:27, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:53:23<32:38:27, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3944, 'learning_rate': 9.583135391923991e-05, 'epoch': 1.91} + 10%|██████▉ | 1704/17840 [2:53:23<32:38:27, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:53:23<32:38:27, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:53:23<32:38:27, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:53:30<32:14:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:53:30<32:14:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:53:30<32:14:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:53:37<31:57:26, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:53:37<31:57:26, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.074, 'learning_rate': 9.581947743467934e-05, 'epoch': 1.91} +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:39,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1707/17840 [2:53:44<31:29:55, 7.03s/it]g-point operations will not be computed-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1707/17840 [2:53:44<31:29:55, 7.03s/it]g-point operations will not be computed-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0849, 'learning_rate': 9.581353919239906e-05, 'epoch': 1.91} + 10%|██████▉ | 1707/17840 [2:53:44<31:29:55, 7.03s/it]g-point operations will not be computed-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1707/17840 [2:53:44<31:29:55, 7.03s/it]g-point operations will not be computed-17 19:34:29,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1708/17840 [2:53:50<31:17:40, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1708/17840 [2:53:50<31:17:40, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3583, 'learning_rate': 9.580760095011877e-05, 'epoch': 1.91} + 10%|██████▉ | 1708/17840 [2:53:50<31:17:40, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1709/17840 [2:53:57<31:04:23, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1709/17840 [2:53:57<31:04:23, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1214, 'learning_rate': 9.580166270783848e-05, 'epoch': 1.92} + 10%|██████▉ | 1709/17840 [2:53:57<31:04:23, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:01,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:01,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9757, 'learning_rate': 9.57957244655582e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:01,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:01,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1711/17840 [2:54:11<30:42:53, 6.86s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1711/17840 [2:54:11<30:42:53, 6.86s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:11,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:11,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1712/17840 [2:54:18<30:29:20, 6.81s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1712/17840 [2:54:18<30:29:20, 6.81s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0752, 'learning_rate': 9.578384798099764e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:20,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:20,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:54:24<30:24:26, 6.79s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:54:24<30:24:26, 6.79s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:54:24<30:24:26, 6.79s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:28,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:28,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9402, 'learning_rate': 9.577197149643706e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:28,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:28,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:28,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1715/17840 [2:54:38<30:04:42, 6.72s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:38,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:38,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:38,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1716/17840 [2:54:44<29:57:19, 6.69s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:44,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:44,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:44,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:54:51<29:42:09, 6.63s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:54:51<29:42:09, 6.63s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:52,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1718/17840 [2:54:57<29:29:44, 6.59s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1718/17840 [2:54:57<29:29:44, 6.59s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0737, 'learning_rate': 9.574821852731592e-05, 'epoch': 1.93} + 10%|███████ | 1718/17840 [2:54:57<29:29:44, 6.59s/it]g-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:00,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:00,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2717, 'learning_rate': 9.574228028503564e-05, 'epoch': 1.93} +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:00,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0762, 'learning_rate': 9.573634204275535e-05, 'epoch': 1.93} +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:49,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:55:16<28:48:57, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:15,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:55:16<28:48:57, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:15,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:55:16<28:48:57, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:15,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:55:16<28:48:57, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:15,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1722/17840 [2:55:23<28:33:30, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:21,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1722/17840 [2:55:23<28:33:30, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:21,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1722/17840 [2:55:23<28:33:30, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:21,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1722/17840 [2:55:23<28:33:30, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:21,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1723/17840 [2:55:29<28:22:48, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:27,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1723/17840 [2:55:29<28:22:48, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:27,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1723/17840 [2:55:29<28:22:48, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:27,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1723/17840 [2:55:29<28:22:48, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:27,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:55:35<28:09:39, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:55:35<28:09:39, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:55:35<28:09:39, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1725/17840 [2:55:43<31:04:46, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1725/17840 [2:55:43<31:04:46, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0341, 'learning_rate': 9.570665083135393e-05, 'epoch': 1.93} +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:45,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:45,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:33,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:55:49<29:45:08, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:48,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:55:49<29:45:08, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:48,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:55:49<29:45:08, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:48,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:55:49<29:45:08, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:48,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1727/17840 [2:55:55<28:40:15, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1727/17840 [2:55:55<28:40:15, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:58,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:58,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3568, 'learning_rate': 9.568883610451307e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:02,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1729/17840 [2:56:07<27:03:27, 6.05s/it]g-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1729/17840 [2:56:07<27:03:27, 6.05s/it]g-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.331, 'learning_rate': 9.568289786223277e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:08,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:56:12<26:21:29, 5.89s/it]g-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:56:12<26:21:29, 5.89s/it]g-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:12,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:14,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:14,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0743, 'learning_rate': 9.567102137767221e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:18,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1732/17840 [2:56:23<24:51:07, 5.55s/it]g-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1732/17840 [2:56:23<24:51:07, 5.55s/it]g-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:22,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:25,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:25,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0392, 'learning_rate': 9.565914489311164e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:28,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1734/17840 [2:56:32<23:17:03, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:31,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1734/17840 [2:56:32<23:17:03, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:31,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:33,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:31,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1735/17840 [2:56:37<22:18:49, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:35,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1735/17840 [2:56:37<22:18:49, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:35,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:37,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:35,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1736/17840 [2:56:41<21:06:47, 4.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:39,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1736/17840 [2:56:41<21:06:47, 4.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:39,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:41,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:39,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1737/17840 [2:56:45<19:49:08, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:43,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1737/17840 [2:56:45<19:49:08, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:43,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1738/17840 [2:56:48<18:21:58, 4.11s/it]g-point operations will not be computed-17 19:37:43,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1738/17840 [2:56:48<18:21:58, 4.11s/it]g-point operations will not be computed-17 19:37:43,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1738/17840 [2:56:48<18:21:58, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:46,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1739/17840 [2:56:51<16:55:44, 3.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1739/17840 [2:56:51<16:55:44, 3.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1740/17840 [2:56:54<15:22:22, 3.44s/it]g-point operations will not be computed-17 19:37:49,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1740/17840 [2:56:54<15:22:22, 3.44s/it]g-point operations will not be computed-17 19:37:49,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1741/17840 [2:56:56<13:53:57, 3.11s/it]g-point operations will not be computed-17 19:37:51,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1741/17840 [2:56:56<13:53:57, 3.11s/it]g-point operations will not be computed-17 19:37:51,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:55,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:54,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1742/17840 [2:56:58<12:43:18, 2.85s/it]g-point operations will not be computed-17 19:37:54,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1742/17840 [2:56:58<12:43:18, 2.85s/it]g-point operations will not be computed-17 19:37:54,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1742/17840 [2:56:58<12:43:18, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:01,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:01,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1743/17840 [2:57:06<19:21:59, 4.33s/it]g-point operations will not be computed-17 19:37:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1743/17840 [2:57:06<19:21:59, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1743/17840 [2:57:06<19:21:59, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:09,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:09,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1744/17840 [2:57:14<23:48:30, 5.32s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1744/17840 [2:57:14<23:48:30, 5.32s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1744/17840 [2:57:14<23:48:30, 5.32s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1744/17840 [2:57:14<23:48:30, 5.32s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1744/17840 [2:57:14<23:48:30, 5.32s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:57:21<26:45:01, 5.98s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:57:21<26:45:01, 5.98s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:57:21<26:45:01, 5.98s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:57:21<26:45:01, 5.98s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:26,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:26,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:26,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:26,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:26,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1747/17840 [2:57:36<29:59:08, 6.71s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1747/17840 [2:57:36<29:59:08, 6.71s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1747/17840 [2:57:36<29:59:08, 6.71s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:40,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:40,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9858, 'learning_rate': 9.557007125890737e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:40,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:40,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:40,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:51<31:06:11, 6.96s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:51<31:06:11, 6.96s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:51<31:06:11, 6.96s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:51<31:06:11, 6.96s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:51<31:06:11, 6.96s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:58:00<34:49:19, 7.79s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:58:00<34:49:19, 7.79s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:58:00<34:49:19, 7.79s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:04,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:04,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1191, 'learning_rate': 9.555225653206651e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:04,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:04,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:04,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1752/17840 [2:58:14<33:10:51, 7.42s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1752/17840 [2:58:14<33:10:51, 7.42s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:17,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:58:21<32:39:11, 7.31s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:58:21<32:39:11, 7.31s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2412, 'learning_rate': 9.554038004750594e-05, 'epoch': 1.97} + 10%|███████▏ | 1753/17840 [2:58:21<32:39:11, 7.31s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:58:21<32:39:11, 7.31s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:58:21<32:39:11, 7.31s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1754/17840 [2:58:28<32:10:31, 7.20s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:29,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:58:35<31:48:33, 7.12s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:58:35<31:48:33, 7.12s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:58:35<31:48:33, 7.12s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0982, 'learning_rate': 9.552256532066509e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1757/17840 [2:58:49<31:15:09, 7.00s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:49,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:49,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1758/17840 [2:58:56<30:55:47, 6.92s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1758/17840 [2:58:56<30:55:47, 6.92s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4141, 'learning_rate': 9.551068883610453e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:58,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:59:03<30:39:58, 6.87s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:59:03<30:39:58, 6.87s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0331, 'learning_rate': 9.550475059382424e-05, 'epoch': 1.97} + 10%|███████▏ | 1759/17840 [2:59:03<30:39:58, 6.87s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:59:03<30:39:58, 6.87s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:59:03<30:39:58, 6.87s/it]g-point operations will not be computed-17 19:38:05,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:59:09<30:30:41, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:59:09<30:30:41, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:59:09<30:30:41, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1761/17840 [2:59:16<30:21:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1761/17840 [2:59:16<30:21:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1764, 'learning_rate': 9.549287410926366e-05, 'epoch': 1.97} + 10%|███████▏ | 1761/17840 [2:59:16<30:21:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:20,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:20,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5214, 'learning_rate': 9.548693586698337e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:20,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:26,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:26,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2756, 'learning_rate': 9.548099762470309e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:26,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:32,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:32,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2214, 'learning_rate': 9.547505938242281e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:32,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:32,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:32,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:08,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:59:42<29:12:11, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:59:42<29:12:11, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:59:42<29:12:11, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1766/17840 [2:59:48<29:03:21, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1766/17840 [2:59:48<29:03:21, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:49,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:49,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1767/17840 [2:59:55<28:47:43, 6.45s/it]g-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1767/17840 [2:59:55<28:47:43, 6.45s/it]g-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:55,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:55,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1768/17840 [3:00:01<28:32:04, 6.39s/it]g-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1768/17840 [3:00:01<28:32:04, 6.39s/it]g-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:01,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:01,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1769/17840 [3:00:07<28:07:41, 6.30s/it]g-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1769/17840 [3:00:07<28:07:41, 6.30s/it]g-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:07,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:07,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:41,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1770/17840 [3:00:13<27:36:22, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1770/17840 [3:00:13<27:36:22, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9891, 'learning_rate': 9.543942992874109e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:16,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:16,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:16,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2207, 'learning_rate': 9.543349168646081e-05, 'epoch': 1.99} +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:22,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:22,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0881, 'learning_rate': 9.542755344418053e-05, 'epoch': 1.99} +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:26,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:26,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1773/17840 [3:00:30<26:18:04, 5.89s/it]g-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:30,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:30,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:30,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:11,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███��███▎ | 1774/17840 [3:00:36<25:46:49, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1774/17840 [3:00:36<25:46:49, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1774/17840 [3:00:36<25:46:49, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1774/17840 [3:00:36<25:46:49, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1775/17840 [3:00:43<27:58:42, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1775/17840 [3:00:43<27:58:42, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:44,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:44,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1776/17840 [3:00:48<26:22:03, 5.91s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:48,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:48,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:50,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:52,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:52,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:54,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:56,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:56,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:58,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:00,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:00,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:01,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:04,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:04,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:06,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:06,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:08,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:08,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:11,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:11,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:12,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:12,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:16,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:16,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:16,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:20,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:20,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:24,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:24,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:24,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [3:01:30<24:04:26, 5.40s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [3:01:30<24:04:26, 5.40s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [3:01:30<24:04:26, 5.40s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:35,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:35,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8469, 'learning_rate': 9.533847980997626e-05, 'epoch': 2.0} +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:35,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:35,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:35,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:45<28:44:17, 6.45s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:45<28:44:17, 6.45s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:45<28:44:17, 6.45s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:45<28:44:17, 6.45s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:45<28:44:17, 6.45s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1789/17840 [3:01:53<29:55:43, 6.71s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:53,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:53,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [3:02:00<30:45:37, 6.90s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [3:02:00<30:45:37, 6.90s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9095, 'learning_rate': 9.532066508313539e-05, 'epoch': 2.01} + 10%|███████▎ | 1790/17840 [3:02:00<30:45:37, 6.90s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [3:02:00<30:45:37, 6.90s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [3:02:00<30:45:37, 6.90s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:02:07<31:06:19, 6.98s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:02:07<31:06:19, 6.98s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [3:02:14<31:25:48, 7.05s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [3:02:14<31:25:48, 7.05s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9992, 'learning_rate': 9.530878859857483e-05, 'epoch': 2.01} + 10%|███████▎ | 1792/17840 [3:02:14<31:25:48, 7.05s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [3:02:14<31:25:48, 7.05s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [3:02:14<31:25:48, 7.05s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:02:22<31:38:48, 7.10s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:02:22<31:38:48, 7.10s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:02:22<31:38:48, 7.10s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:26,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:26,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8119, 'learning_rate': 9.529691211401426e-05, 'epoch': 2.01} +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:26,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:26,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:26,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [3:02:36<31:41:32, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [3:02:36<31:41:32, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:38,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:43<31:40:14, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:43<31:40:14, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0333, 'learning_rate': 9.528503562945369e-05, 'epoch': 2.01} + 10%|███████▎ | 1796/17840 [3:02:43<31:40:14, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:43<31:40:14, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:43<31:40:14, 7.11s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1797/17840 [3:02:50<31:35:59, 7.09s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:50,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:50,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1798/17840 [3:02:57<31:29:59, 7.07s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1798/17840 [3:02:57<31:29:59, 7.07s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6415, 'learning_rate': 9.527315914489313e-05, 'epoch': 2.02} + 10%|███████▎ | 1798/17840 [3:02:57<31:29:59, 7.07s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:01,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:01,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0047, 'learning_rate': 9.526722090261283e-05, 'epoch': 2.02} +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:01,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:01,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:03:13<34:19:42, 7.70s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:03:13<34:19:42, 7.70s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9737, 'learning_rate': 9.526128266033255e-05, 'epoch': 2.02} + 10%|███████▎ | 1800/17840 [3:03:13<34:19:42, 7.70s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:03:13<34:19:42, 7.70s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:03:13<34:19:42, 7.70s/it]g-point operations will not be computed-17 19:41:34,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [3:03:20<33:16:39, 7.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [3:03:20<33:16:39, 7.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [3:03:20<33:16:39, 7.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [3:03:20<33:16:39, 7.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:03:27<32:24:35, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:03:27<32:24:35, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:03:27<32:24:35, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:31,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:31,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8908, 'learning_rate': 9.524346793349169e-05, 'epoch': 2.02} +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:31,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:31,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:31,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:19,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [3:03:41<31:21:20, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [3:03:41<31:21:20, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [3:03:41<31:21:20, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [3:03:41<31:21:20, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [3:03:47<30:58:30, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [3:03:47<30:58:30, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:49,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1806/17840 [3:03:54<30:39:54, 6.89s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1806/17840 [3:03:54<30:39:54, 6.89s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6839, 'learning_rate': 9.522565320665083e-05, 'epoch': 2.02} + 10%|███████▍ | 1806/17840 [3:03:54<30:39:54, 6.89s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:58,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:58,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7562, 'learning_rate': 9.521971496437056e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:58,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:58,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:58,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1808/17840 [3:04:07<30:14:38, 6.79s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:08,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:08,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1809/17840 [3:04:14<30:09:38, 6.77s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1809/17840 [3:04:14<30:09:38, 6.77s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8306, 'learning_rate': 9.520783847980998e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:16,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1810/17840 [3:04:21<29:46:55, 6.69s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1810/17840 [3:04:21<29:46:55, 6.69s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6959, 'learning_rate': 9.520190023752969e-05, 'epoch': 2.03} + 10%|███████▍ | 1810/17840 [3:04:21<29:46:55, 6.69s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:24,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:24,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8119, 'learning_rate': 9.519596199524941e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:24,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:30,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:30,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7431, 'learning_rate': 9.519002375296913e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:30,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:30,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:30,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1813/17840 [3:04:40<28:47:20, 6.47s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:40,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:40,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:40,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1814/17840 [3:04:46<28:33:53, 6.42s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:46,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:46,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:46,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [3:04:52<28:18:21, 6.36s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:52,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:52,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:52,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1816/17840 [3:04:58<28:01:49, 6.30s/it]g-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:58,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:58,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:58,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:39,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [3:05:04<27:37:02, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [3:05:04<27:37:02, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [3:05:04<27:37:02, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [3:05:04<27:37:02, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1818/17840 [3:05:10<27:11:15, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:10,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:10,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:10,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:03,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [3:05:16<26:46:55, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [3:05:16<26:46:55, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:19,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:19,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.46, 'learning_rate': 9.514251781472685e-05, 'epoch': 2.04} +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:23,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1821/17840 [3:05:27<25:52:58, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:26,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1821/17840 [3:05:27<25:52:58, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:26,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8716, 'learning_rate': 9.513657957244656e-05, 'epoch': 2.04} + 10%|███████▍ | 1821/17840 [3:05:27<25:52:58, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:26,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1821/17840 [3:05:27<25:52:58, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:26,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1822/17840 [3:05:33<25:12:22, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:33,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1823/17840 [3:05:38<24:25:57, 5.49s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1823/17840 [3:05:38<24:25:57, 5.49s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:37,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:40,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:40,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7342, 'learning_rate': 9.51187648456057e-05, 'epoch': 2.04} +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:43,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1825/17840 [3:05:50<25:37:34, 5.76s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1825/17840 [3:05:50<25:37:34, 5.76s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:49,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:51,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:51,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:53,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:53,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:55,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:57,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:57,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:59,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:02,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:02,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:04,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:04,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:06,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:08,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:08,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:10,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:10,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:12,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:12,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:13,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:13,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:16,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:16,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:20,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:20,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:20,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:23,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:23,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:27,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:27,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:27,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:31,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:31,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:36,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:36,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1837/17840 [3:06:41<26:13:12, 5.90s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1837/17840 [3:06:41<26:13:12, 5.90s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1837/17840 [3:06:41<26:13:12, 5.90s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1837/17840 [3:06:41<26:13:12, 5.90s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1837/17840 [3:06:41<26:13:12, 5.90s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:49<28:07:38, 6.33s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:49<28:07:38, 6.33s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:49<28:07:38, 6.33s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:53,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:53,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0562, 'learning_rate': 9.502969121140143e-05, 'epoch': 2.06} +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:53,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:53,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:53,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:07:03<30:19:11, 6.82s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:07:03<30:19:11, 6.82s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:07:03<30:19:11, 6.82s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:07:03<30:19:11, 6.82s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:07:03<30:19:11, 6.82s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [3:07:11<30:51:34, 6.94s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:11,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:11,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:11,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1842/17840 [3:07:18<31:10:11, 7.01s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1842/17840 [3:07:18<31:10:11, 7.01s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1842/17840 [3:07:18<31:10:11, 7.01s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1842/17840 [3:07:18<31:10:11, 7.01s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1842/17840 [3:07:18<31:10:11, 7.01s/it]g-point operations will not be computed-17 19:46:31,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [3:07:25<31:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [3:07:25<31:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [3:07:25<31:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [3:07:25<31:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:07:32<31:27:51, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:07:32<31:27:51, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:07:32<31:27:51, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:36,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:36,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7366, 'learning_rate': 9.499406175771973e-05, 'epoch': 2.07} +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:36,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:36,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:36,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [3:07:46<31:15:19, 7.04s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [3:07:46<31:15:19, 7.04s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:48,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1847/17840 [3:07:53<31:06:43, 7.00s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1847/17840 [3:07:53<31:06:43, 7.00s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0892, 'learning_rate': 9.498218527315915e-05, 'epoch': 2.07} + 10%|███████▌ | 1847/17840 [3:07:53<31:06:43, 7.00s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1847/17840 [3:07:53<31:06:43, 7.00s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1847/17840 [3:07:53<31:06:43, 7.00s/it]g-point operations will not be computed-17 19:48:24,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [3:08:00<30:56:17, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [3:08:00<30:56:17, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [3:08:00<30:56:17, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [3:08:07<30:47:37, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [3:08:07<30:47:37, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9146, 'learning_rate': 9.497030878859858e-05, 'epoch': 2.07} + 10%|███████▌ | 1849/17840 [3:08:07<30:47:37, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [3:08:07<30:47:37, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [3:08:07<30:47:37, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1850/17840 [3:08:16<33:50:50, 7.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:16,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:16,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:16,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:08:23<32:51:19, 7.40s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:08:23<32:51:19, 7.40s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:25,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:08:29<31:58:03, 7.20s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:08:29<31:58:03, 7.20s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0244, 'learning_rate': 9.495249406175773e-05, 'epoch': 2.08} + 10%|███████▌ | 1852/17840 [3:08:29<31:58:03, 7.20s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:08:29<31:58:03, 7.20s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:08:29<31:58:03, 7.20s/it]g-point operations will not be computed-17 19:48:59,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:08:36<31:20:15, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:08:36<31:20:15, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:08:36<31:20:15, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:08:36<31:20:15, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1854/17840 [3:08:43<30:55:15, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:43,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:43,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1855/17840 [3:08:50<30:36:53, 6.89s/it]g-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1855/17840 [3:08:50<30:36:53, 6.89s/it]g-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0276, 'learning_rate': 9.493467933491686e-05, 'epoch': 2.08} + 10%|███████▌ | 1855/17840 [3:08:50<30:36:53, 6.89s/it]g-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1855/17840 [3:08:50<30:36:53, 6.89s/it]g-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1855/17840 [3:08:50<30:36:53, 6.89s/it]g-point operations will not be computed-17 19:49:35,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:08:56<30:22:03, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:08:56<30:22:03, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:08:56<30:22:03, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:08:56<30:22:03, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1857/17840 [3:09:03<30:01:23, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:03,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:03,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:03,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1858/17840 [3:09:09<29:40:39, 6.69s/it]g-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:10,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:10,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1859/17840 [3:09:16<29:21:19, 6.61s/it]g-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1859/17840 [3:09:16<29:21:19, 6.61s/it]g-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9975, 'learning_rate': 9.491092636579573e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:18,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:09:23<29:22:17, 6.62s/it]g-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:09:23<29:22:17, 6.62s/it]g-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7912, 'learning_rate': 9.490498812351545e-05, 'epoch': 2.09} + 10%|███████▌ | 1860/17840 [3:09:23<29:22:17, 6.62s/it]g-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8219, 'learning_rate': 9.489904988123516e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:55,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1862/17840 [3:09:35<28:46:39, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1862/17840 [3:09:35<28:46:39, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1862/17840 [3:09:35<28:46:39, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1862/17840 [3:09:35<28:46:39, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:09:42<28:36:10, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:42,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:42,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:42,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:09:48<28:21:41, 6.39s/it]g-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:48,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:48,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:48,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1865/17840 [3:09:54<28:05:19, 6.33s/it]g-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:54,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:54,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:54,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1866/17840 [3:10:00<27:48:18, 6.27s/it]g-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:00,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:00,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:00,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:34,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:10:06<27:23:41, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:05,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:10:06<27:23:41, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:05,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:10:06<27:23:41, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:05,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:10:06<27:23:41, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:05,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1868/17840 [3:10:12<26:57:43, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1868/17840 [3:10:12<26:57:43, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:15,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:15,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8204, 'learning_rate': 9.485154394299288e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:19,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1870/17840 [3:10:23<26:00:19, 5.86s/it]g-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1870/17840 [3:10:23<26:00:19, 5.86s/it]g-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6991, 'learning_rate': 9.484560570071259e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:25,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1871/17840 [3:10:29<25:40:33, 5.79s/it]g-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1871/17840 [3:10:29<25:40:33, 5.79s/it]g-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:29,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:31,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:31,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6995, 'learning_rate': 9.483372921615203e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:35,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1873/17840 [3:10:40<24:38:59, 5.56s/it]g-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1873/17840 [3:10:40<24:38:59, 5.56s/it]g-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:39,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:39,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:39,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:10,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1874/17840 [3:10:45<24:02:04, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:46,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1875/17840 [3:10:52<26:25:30, 5.96s/it]g-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1875/17840 [3:10:52<26:25:30, 5.96s/it]g-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:51,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:54,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:54,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8188, 'learning_rate': 9.480997624703088e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:57,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1877/17840 [3:11:01<23:20:45, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:59,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1877/17840 [3:11:01<23:20:45, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:59,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:01,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:59,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1878/17840 [3:11:05<21:51:56, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:03,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1878/17840 [3:11:05<21:51:56, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:03,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:05,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:03,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1879/17840 [3:11:09<20:24:28, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:07,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1879/17840 [3:11:09<20:24:28, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:07,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1880/17840 [3:11:13<19:03:44, 4.30s/it]g-point operations will not be computed-17 19:52:07,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1880/17840 [3:11:13<19:03:44, 4.30s/it]g-point operations will not be computed-17 19:52:07,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1880/17840 [3:11:13<19:03:44, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:11,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1881/17840 [3:11:16<17:37:18, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:14,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1881/17840 [3:11:16<17:37:18, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:14,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1882/17840 [3:11:19<16:10:27, 3.65s/it]g-point operations will not be computed-17 19:52:14,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1882/17840 [3:11:19<16:10:27, 3.65s/it]g-point operations will not be computed-17 19:52:14,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:18,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:17,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:20,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:19,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:20,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:19,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:11:24<13:17:26, 3.00s/it]g-point operations will not be computed-17 19:52:19,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:11:24<13:17:26, 3.00s/it]g-point operations will not be computed-17 19:52:19,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:11:24<13:17:26, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:23,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:11:24<13:17:26, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:23,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:27,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:23,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:27,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:23,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:11:32<19:37:56, 4.43s/it]g-point operations will not be computed-17 19:52:23,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:11:32<19:37:56, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:34,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:11:39<23:48:52, 5.37s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:11:39<23:48:52, 5.37s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.907, 'learning_rate': 9.475059382422803e-05, 'epoch': 2.11} + 11%|███████▋ | 1886/17840 [3:11:39<23:48:52, 5.37s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:11:39<23:48:52, 5.37s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1887/17840 [3:11:47<26:36:51, 6.01s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1887/17840 [3:11:47<26:36:51, 6.01s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0734, 'learning_rate': 9.474465558194775e-05, 'epoch': 2.12} + 11%|███████▋ | 1887/17840 [3:11:47<26:36:51, 6.01s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1887/17840 [3:11:47<26:36:51, 6.01s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1888/17840 [3:11:54<28:28:01, 6.42s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1888/17840 [3:11:54<28:28:01, 6.42s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:55,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:55,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1889/17840 [3:12:01<29:39:44, 6.69s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1889/17840 [3:12:01<29:39:44, 6.69s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7925, 'learning_rate': 9.473277909738718e-05, 'epoch': 2.12} + 11%|███████▋ | 1889/17840 [3:12:01<29:39:44, 6.69s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1889/17840 [3:12:01<29:39:44, 6.69s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1890/17840 [3:12:09<30:22:26, 6.86s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1890/17840 [3:12:09<30:22:26, 6.86s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7958, 'learning_rate': 9.472684085510688e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:11,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:12:16<30:44:07, 6.94s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:12:16<30:44:07, 6.94s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9545, 'learning_rate': 9.472090261282662e-05, 'epoch': 2.12} + 11%|███████▋ | 1891/17840 [3:12:16<30:44:07, 6.94s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:12:16<30:44:07, 6.94s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1892/17840 [3:12:23<31:00:45, 7.00s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1892/17840 [3:12:23<31:00:45, 7.00s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8051, 'learning_rate': 9.471496437054632e-05, 'epoch': 2.12} + 11%|███████▋ | 1892/17840 [3:12:23<31:00:45, 7.00s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:27,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:27,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.999, 'learning_rate': 9.470902612826605e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:27,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:27,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1894/17840 [3:12:37<31:12:07, 7.04s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1894/17840 [3:12:37<31:12:07, 7.04s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:38,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:38,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:38,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1895/17840 [3:12:44<31:05:36, 7.02s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1895/17840 [3:12:44<31:05:36, 7.02s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1895/17840 [3:12:44<31:05:36, 7.02s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7052, 'learning_rate': 9.469121140142518e-05, 'epoch': 2.13} +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1897/17840 [3:12:58<30:48:57, 6.96s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1897/17840 [3:12:58<30:48:57, 6.96s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:00,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:00,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:13:05<30:49:58, 6.96s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:13:05<30:49:58, 6.96s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:13:05<30:49:58, 6.96s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9934, 'learning_rate': 9.467339667458433e-05, 'epoch': 2.13} +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:09,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:13:21<33:34:14, 7.58s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:13:21<33:34:14, 7.58s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:13:21<33:34:14, 7.58s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:13:21<33:34:14, 7.58s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:13:21<33:34:14, 7.58s/it]g-point operations will not be computed-17 19:52:30,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:13:28<32:37:09, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:13:28<32:37:09, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:13:28<32:37:09, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:13:28<32:37:09, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1902/17840 [3:13:34<31:58:17, 7.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1902/17840 [3:13:34<31:58:17, 7.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:36,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:36,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:13:41<31:22:34, 7.09s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:13:41<31:22:34, 7.09s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:13:41<31:22:34, 7.09s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:45,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:45,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.624, 'learning_rate': 9.46437054631829e-05, 'epoch': 2.13} +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:45,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:45,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:45,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1905/17840 [3:13:54<30:20:14, 6.85s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:55,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:55,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:55,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:14:01<30:04:16, 6.79s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:14:01<30:04:16, 6.79s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:03,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:03,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:14:08<29:50:38, 6.74s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:14:08<29:50:38, 6.74s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:14:08<29:50:38, 6.74s/it]g-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:11,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:11,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0331, 'learning_rate': 9.461995249406176e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:11,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:11,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:11,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:54:26,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:14:21<29:27:32, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:14:21<29:27:32, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:14:21<29:27:32, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:14:21<29:27:32, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1910/17840 [3:14:27<29:03:53, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:27,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:27,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:27,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1911/17840 [3:14:34<28:48:15, 6.51s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1911/17840 [3:14:34<28:48:15, 6.51s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1912/17840 [3:14:40<28:29:56, 6.44s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1912/17840 [3:14:40<28:29:56, 6.44s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:42,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:42,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1913/17840 [3:14:46<28:09:42, 6.37s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1913/17840 [3:14:46<28:09:42, 6.37s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:48,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:48,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1914/17840 [3:14:52<27:51:08, 6.30s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1914/17840 [3:14:52<27:51:08, 6.30s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:54,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:54,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1915/17840 [3:14:58<27:30:45, 6.22s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1915/17840 [3:14:58<27:30:45, 6.22s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:00,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:00,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1916/17840 [3:15:04<27:11:49, 6.15s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:04,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:04,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:04,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1917/17840 [3:15:10<26:45:11, 6.05s/it]g-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:10,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:10,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:10,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:20,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1918/17840 [3:15:16<26:25:32, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1918/17840 [3:15:16<26:25:32, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:19,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:19,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7275, 'learning_rate': 9.455463182897863e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:19,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:24,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:24,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8443, 'learning_rate': 9.454869358669835e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:28,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:28,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:14,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1921/17840 [3:15:33<25:09:32, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1921/17840 [3:15:33<25:09:32, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:35,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:35,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6619, 'learning_rate': 9.453681710213777e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:39,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:39,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1923/17840 [3:15:43<23:52:56, 5.40s/it]g-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:42,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:45,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:45,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:47,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:47,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:47,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:31,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1925/17840 [3:15:55<25:16:08, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:53,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:55,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:53,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:55,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:53,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1926/17840 [3:15:59<23:32:03, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:57,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:59,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:57,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:59,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:57,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1927/17840 [3:16:03<21:53:29, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:01,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:03,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:01,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:03,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:01,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1928/17840 [3:16:07<20:22:45, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:05,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1929/17840 [3:16:10<18:51:55, 4.27s/it]g-point operations will not be computed-17 19:57:05,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1929/17840 [3:16:10<18:51:55, 4.27s/it]g-point operations will not be computed-17 19:57:05,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1929/17840 [3:16:10<18:51:55, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:08,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1930/17840 [3:16:14<17:25:29, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:11,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1930/17840 [3:16:14<17:25:29, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:11,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1931/17840 [3:16:16<15:57:04, 3.61s/it]g-point operations will not be computed-17 19:57:11,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1931/17840 [3:16:16<15:57:04, 3.61s/it]g-point operations will not be computed-17 19:57:11,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:15,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:14,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:15,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:14,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1932/17840 [3:16:19<14:34:06, 3.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:17,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1932/17840 [3:16:19<14:34:06, 3.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:17,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1933/17840 [3:16:21<13:23:23, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:19,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1934/17840 [3:16:24<12:12:39, 2.76s/it]g-point operations will not be computed-17 19:57:19,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1934/17840 [3:16:24<12:12:39, 2.76s/it]g-point operations will not be computed-17 19:57:19,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1934/17840 [3:16:24<12:12:39, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:23,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1934/17840 [3:16:24<12:12:39, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:23,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:27,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:23,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1935/17840 [3:16:32<19:10:05, 4.34s/it]g-point operations will not be computed-17 19:57:23,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1935/17840 [3:16:32<19:10:05, 4.34s/it]g-point operations will not be computed-17 19:57:23,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1935/17840 [3:16:32<19:10:05, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1935/17840 [3:16:32<19:10:05, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:34,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:34,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1936/17840 [3:16:39<23:30:34, 5.32s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1936/17840 [3:16:39<23:30:34, 5.32s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:42,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1937/17840 [3:16:47<26:16:26, 5.95s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1937/17840 [3:16:47<26:16:26, 5.95s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7427, 'learning_rate': 9.44477434679335e-05, 'epoch': 2.17} + 11%|███████▉ | 1937/17840 [3:16:47<26:16:26, 5.95s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1937/17840 [3:16:47<26:16:26, 5.95s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1938/17840 [3:16:54<28:14:56, 6.40s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1938/17840 [3:16:54<28:14:56, 6.40s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0508, 'learning_rate': 9.444180522565322e-05, 'epoch': 2.17} + 11%|███████▉ | 1938/17840 [3:16:54<28:14:56, 6.40s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:58,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:58,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9649, 'learning_rate': 9.443586698337292e-05, 'epoch': 2.17} +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:58,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:58,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1940/17840 [3:17:09<30:16:50, 6.86s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1940/17840 [3:17:09<30:16:50, 6.86s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9661, 'learning_rate': 9.442992874109264e-05, 'epoch': 2.17} + 11%|███████▉ | 1940/17840 [3:17:09<30:16:50, 6.86s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1940/17840 [3:17:09<30:16:50, 6.86s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:17:16<30:49:21, 6.98s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:17:16<30:49:21, 6.98s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:16,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:16,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:17:23<31:07:57, 7.05s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:17:23<31:07:57, 7.05s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8938, 'learning_rate': 9.441805225653207e-05, 'epoch': 2.18} + 11%|███████▉ | 1942/17840 [3:17:23<31:07:57, 7.05s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:17:23<31:07:57, 7.05s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:17:23<31:07:57, 7.05s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:17:30<31:23:45, 7.11s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:31,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:31,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1944/17840 [3:17:37<31:22:47, 7.11s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1944/17840 [3:17:37<31:22:47, 7.11s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7306, 'learning_rate': 9.440617577197151e-05, 'epoch': 2.18} + 11%|███████▉ | 1944/17840 [3:17:37<31:22:47, 7.11s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1944/17840 [3:17:37<31:22:47, 7.11s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1945/17840 [3:17:44<31:14:43, 7.08s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1945/17840 [3:17:44<31:14:43, 7.08s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:45,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:45,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:17:51<31:09:25, 7.06s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:17:51<31:09:25, 7.06s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9197, 'learning_rate': 9.439429928741093e-05, 'epoch': 2.18} + 11%|███████▉ | 1946/17840 [3:17:51<31:09:25, 7.06s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:17:51<31:09:25, 7.06s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:17:51<31:09:25, 7.06s/it]g-point operations will not be computed-17 19:57:30,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:59<31:09:53, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:59<31:09:53, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:59<31:09:53, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:18:05<31:01:01, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:18:05<31:01:01, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6882, 'learning_rate': 9.438242280285035e-05, 'epoch': 2.18} + 11%|███████▉ | 1948/17840 [3:18:05<31:01:01, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:09,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:09,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.188, 'learning_rate': 9.437648456057007e-05, 'epoch': 2.18} +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:09,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:09,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:09,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1950/17840 [3:18:22<33:52:48, 7.68s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:22,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:22,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:22,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1951/17840 [3:18:29<32:51:11, 7.44s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1951/17840 [3:18:29<32:51:11, 7.44s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1951/17840 [3:18:29<32:51:11, 7.44s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:32,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:32,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.644, 'learning_rate': 9.435866983372922e-05, 'epoch': 2.19} +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:32,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:32,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:32,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1953/17840 [3:18:42<31:20:58, 7.10s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:42,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:42,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:42,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:18:49<30:50:52, 6.99s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:18:49<30:50:52, 6.99s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:18:49<30:50:52, 6.99s/it]g-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:52,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:52,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7997, 'learning_rate': 9.434085510688837e-05, 'epoch': 2.19} +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:52,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:52,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:52,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:57,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1956/17840 [3:19:02<29:59:49, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1956/17840 [3:19:02<29:59:49, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1956/17840 [3:19:02<29:59:49, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1956/17840 [3:19:02<29:59:49, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:19:09<29:52:56, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:09,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1958/17840 [3:19:15<29:39:32, 6.72s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1958/17840 [3:19:15<29:39:32, 6.72s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:17,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1959/17840 [3:19:22<29:21:29, 6.66s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1959/17840 [3:19:22<29:21:29, 6.66s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6141, 'learning_rate': 9.431710213776722e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:24,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1960/17840 [3:19:28<29:00:31, 6.58s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1960/17840 [3:19:28<29:00:31, 6.58s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0426, 'learning_rate': 9.431116389548694e-05, 'epoch': 2.2} + 11%|████████ | 1960/17840 [3:19:28<29:00:31, 6.58s/it]g-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6638, 'learning_rate': 9.430522565320665e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:01,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:19:41<28:29:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:40,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:19:41<28:29:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:40,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:19:41<28:29:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:40,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:19:41<28:29:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:40,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1963/17840 [3:19:47<28:10:01, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:46,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1963/17840 [3:19:47<28:10:01, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:46,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1963/17840 [3:19:47<28:10:01, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:46,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1963/17840 [3:19:47<28:10:01, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:46,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1964/17840 [3:19:53<27:57:11, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1964/17840 [3:19:53<27:57:11, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1964/17840 [3:19:53<27:57:11, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1964/17840 [3:19:53<27:57:11, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1965/17840 [3:20:00<27:45:21, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:00,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:00,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:00,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1966/17840 [3:20:06<27:33:20, 6.25s/it]g-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:06,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:06,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:06,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:00:52,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1967/17840 [3:20:12<27:08:38, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:10,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1967/17840 [3:20:12<27:08:38, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:10,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1967/17840 [3:20:12<27:08:38, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:10,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1967/17840 [3:20:12<27:08:38, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:10,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1968/17840 [3:20:18<26:44:55, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1968/17840 [3:20:18<26:44:55, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:20,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:20,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0762, 'learning_rate': 9.425771971496437e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:24,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1970/17840 [3:20:29<25:47:11, 5.85s/it]g-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1970/17840 [3:20:29<25:47:11, 5.85s/it]g-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:16,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1971/17840 [3:20:34<25:18:32, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1971/17840 [3:20:34<25:18:32, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:37,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:37,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6304, 'learning_rate': 9.423990498812352e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:41,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:20:45<24:24:01, 5.54s/it]g-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:20:45<24:24:01, 5.54s/it]g-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:45,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:45,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:45,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:33,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1974/17840 [3:20:50<23:47:53, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:51,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1975/17840 [3:20:57<25:53:29, 5.88s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1975/17840 [3:20:57<25:53:29, 5.88s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:56,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:01,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:03,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:03,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:05,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:07,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:07,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:09,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:10,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:10,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:12,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:12,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:14,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:17,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:17,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:19,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:19,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:21,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:21,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:23,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:23,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:24,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:24,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:28,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:31,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:31,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9739, 'learning_rate': 9.416270783847982e-05, 'epoch': 2.23} +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:35,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:35,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:39,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:39,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8944, 'learning_rate': 9.415676959619954e-05, 'epoch': 2.23} +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:39,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:39,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:39,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1987/17840 [3:21:49<25:56:50, 5.89s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1987/17840 [3:21:49<25:56:50, 5.89s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:52,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:21:57<27:44:37, 6.30s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:21:57<27:44:37, 6.30s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0155, 'learning_rate': 9.414489311163895e-05, 'epoch': 2.23} + 11%|████████▏ | 1988/17840 [3:21:57<27:44:37, 6.30s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:21:57<27:44:37, 6.30s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1989/17840 [3:22:04<29:06:32, 6.61s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1989/17840 [3:22:04<29:06:32, 6.61s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9818, 'learning_rate': 9.413895486935867e-05, 'epoch': 2.23} + 11%|████████▏ | 1989/17840 [3:22:04<29:06:32, 6.61s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:08,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:08,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7809, 'learning_rate': 9.413301662707839e-05, 'epoch': 2.23} +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:08,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:08,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:22:19<30:39:45, 6.96s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:22:19<30:39:45, 6.96s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1762, 'learning_rate': 9.412707838479811e-05, 'epoch': 2.23} + 11%|████████▏ | 1991/17840 [3:22:19<30:39:45, 6.96s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:22:19<30:39:45, 6.96s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:22:19<30:39:45, 6.96s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:22:26<30:56:00, 7.03s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:26,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:26,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1993/17840 [3:22:33<31:06:35, 7.07s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1993/17840 [3:22:33<31:06:35, 7.07s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6975, 'learning_rate': 9.411520190023754e-05, 'epoch': 2.23} + 11%|████████▏ | 1993/17840 [3:22:33<31:06:35, 7.07s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1993/17840 [3:22:33<31:06:35, 7.07s/it]g-point operations will not be computed-17 20:01:48,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:22:40<31:05:23, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:22:40<31:05:23, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8525, 'learning_rate': 9.410926365795725e-05, 'epoch': 2.24} + 11%|████████▏ | 1994/17840 [3:22:40<31:05:23, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1995/17840 [3:22:47<30:54:00, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1995/17840 [3:22:47<30:54:00, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8146, 'learning_rate': 9.410332541567697e-05, 'epoch': 2.24} + 11%|████████▏ | 1995/17840 [3:22:47<30:54:00, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:51,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:51,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8662, 'learning_rate': 9.409738717339667e-05, 'epoch': 2.24} +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:51,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:51,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1997/17840 [3:23:01<30:42:32, 6.98s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1997/17840 [3:23:01<30:42:32, 6.98s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8151, 'learning_rate': 9.409144893111639e-05, 'epoch': 2.24} + 11%|████████▏ | 1997/17840 [3:23:01<30:42:32, 6.98s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:05,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:05,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6374, 'learning_rate': 9.408551068883611e-05, 'epoch': 2.24} +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:05,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:05,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:05,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1999/17840 [3:23:15<30:32:48, 6.94s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:15,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:15,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:23:24<33:33:45, 7.63s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:23:24<33:33:45, 7.63s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7942, 'learning_rate': 9.407363420427554e-05, 'epoch': 2.24} + 11%|████████▏ | 2000/17840 [3:23:24<33:33:45, 7.63s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:23:24<33:33:45, 7.63s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:23:24<33:33:45, 7.63s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2001/17840 [3:23:31<32:32:41, 7.40s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:31,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:31,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2002/17840 [3:23:37<31:44:40, 7.22s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2002/17840 [3:23:37<31:44:40, 7.22s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6933, 'learning_rate': 9.406175771971497e-05, 'epoch': 2.24} + 11%|████████▏ | 2002/17840 [3:23:37<31:44:40, 7.22s/it]g-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:41,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:41,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8754, 'learning_rate': 9.405581947743467e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:41,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:41,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:41,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:39,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:51<30:40:34, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:51<30:40:34, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:51<30:40:34, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:23:58<30:19:03, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:23:58<30:19:03, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:58,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:58,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2006/17840 [3:24:04<30:07:21, 6.85s/it]g-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2006/17840 [3:24:04<30:07:21, 6.85s/it]g-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9494, 'learning_rate': 9.403800475059384e-05, 'epoch': 2.25} + 11%|████████▏ | 2006/17840 [3:24:04<30:07:21, 6.85s/it]g-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:08,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:08,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7468, 'learning_rate': 9.403206650831354e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:08,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:08,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:50,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2008/17840 [3:24:18<29:28:34, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2008/17840 [3:24:18<29:28:34, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9178, 'learning_rate': 9.402612826603325e-05, 'epoch': 2.25} + 11%|████████▏ | 2008/17840 [3:24:18<29:28:34, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2009/17840 [3:24:24<29:10:41, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2009/17840 [3:24:24<29:10:41, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:24,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:24,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2010/17840 [3:24:30<28:50:16, 6.56s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2010/17840 [3:24:30<28:50:16, 6.56s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:31,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:31,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2011/17840 [3:24:37<28:37:20, 6.51s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2011/17840 [3:24:37<28:37:20, 6.51s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8691, 'learning_rate': 9.400831353919241e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:39,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2012/17840 [3:24:43<28:25:20, 6.46s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2012/17840 [3:24:43<28:25:20, 6.46s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7748, 'learning_rate': 9.400237529691212e-05, 'epoch': 2.26} +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:45,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2013/17840 [3:24:49<28:07:58, 6.40s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2013/17840 [3:24:49<28:07:58, 6.40s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8343, 'learning_rate': 9.399643705463184e-05, 'epoch': 2.26} + 11%|████████▏ | 2013/17840 [3:24:49<28:07:58, 6.40s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|██████���█▏ | 2013/17840 [3:24:49<28:07:58, 6.40s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:53,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:53,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:57,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2015/17840 [3:25:02<27:40:18, 6.29s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2015/17840 [3:25:02<27:40:18, 6.29s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1294, 'learning_rate': 9.398456057007126e-05, 'epoch': 2.26} +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:03,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2016/17840 [3:25:08<27:32:12, 6.26s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2016/17840 [3:25:08<27:32:12, 6.26s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5789, 'learning_rate': 9.397862232779097e-05, 'epoch': 2.26} + 11%|████████▏ | 2016/17840 [3:25:08<27:32:12, 6.26s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:11,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:11,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9848, 'learning_rate': 9.397268408551069e-05, 'epoch': 2.26} +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:11,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:11,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:17,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:17,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:21,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:21,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2019/17840 [3:25:26<26:31:34, 6.04s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2019/17840 [3:25:26<26:31:34, 6.04s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:27,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:27,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2020/17840 [3:25:32<26:03:39, 5.93s/it]g-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:16,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:25:37<25:36:37, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:25:37<25:36:37, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:25:37<25:36:37, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:39,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:39,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:43,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:43,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2023/17840 [3:25:48<24:26:52, 5.56s/it]g-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:47,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:47,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:52,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:52,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:52,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:35,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2025/17840 [3:26:00<25:34:36, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:58,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:00,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:58,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:00,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:58,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2026/17840 [3:26:04<23:47:01, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:07:02,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:04,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:02,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:04,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:02,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2027/17840 [3:26:08<22:09:05, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:08,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:08,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2028/17840 [3:26:12<20:42:13, 4.71s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:11,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:11,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:13,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:13,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:16,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:17,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:17,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:19,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:19,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:24,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7621, 'learning_rate': 9.387173396674584e-05, 'epoch': 2.28} +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:30,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:30,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:30,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:34,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:34,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:38,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:38,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:38,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:41,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:41,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:41,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:41,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:41,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:52<26:12:38, 5.97s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:52<26:12:38, 5.97s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:55,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:27:00<28:13:30, 6.43s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:27:00<28:13:30, 6.43s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6884, 'learning_rate': 9.384798099762471e-05, 'epoch': 2.28} + 11%|████████▎ | 2038/17840 [3:27:00<28:13:30, 6.43s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:27:00<28:13:30, 6.43s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:27:00<28:13:30, 6.43s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:27:07<29:31:02, 6.73s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:27:07<29:31:02, 6.73s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:27:07<29:31:02, 6.73s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:27:07<29:31:02, 6.73s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:27:07<29:31:02, 6.73s/it]g-point operations will not be computed-17 20:07:06,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:27:14<30:17:50, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:27:14<30:17:50, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:27:14<30:17:50, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2041/17840 [3:27:22<30:55:56, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2041/17840 [3:27:22<30:55:56, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.671, 'learning_rate': 9.383016627078384e-05, 'epoch': 2.29} + 11%|████████▎ | 2041/17840 [3:27:22<30:55:56, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2041/17840 [3:27:22<30:55:56, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2041/17840 [3:27:22<30:55:56, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:27:29<31:23:30, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:27:29<31:23:30, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:31,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:27:36<31:30:41, 7.18s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:27:36<31:30:41, 7.18s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8985, 'learning_rate': 9.381828978622329e-05, 'epoch': 2.29} + 11%|████████▎ | 2043/17840 [3:27:36<31:30:41, 7.18s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:27:36<31:30:41, 7.18s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:27:36<31:30:41, 7.18s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:44<31:33:26, 7.19s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:44<31:33:26, 7.19s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:44<31:33:26, 7.19s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:48,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:48,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8035, 'learning_rate': 9.380641330166271e-05, 'epoch': 2.29} +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:48,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:48,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:48,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:58<31:15:45, 7.13s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:58<31:15:45, 7.13s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:58<31:15:45, 7.13s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:02,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:02,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1396, 'learning_rate': 9.379453681710214e-05, 'epoch': 2.29} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:02,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:02,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:02,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:28:12<30:59:04, 7.06s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:12,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:12,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2049/17840 [3:28:19<30:48:37, 7.02s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2049/17840 [3:28:19<30:48:37, 7.02s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0296, 'learning_rate': 9.378266033254157e-05, 'epoch': 2.3} + 11%|████████▍ | 2049/17840 [3:28:19<30:48:37, 7.02s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2049/17840 [3:28:19<30:48:37, 7.02s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2049/17840 [3:28:19<30:48:37, 7.02s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2050/17840 [3:28:28<33:46:18, 7.70s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:28,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:28,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2051/17840 [3:28:35<32:48:11, 7.48s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2051/17840 [3:28:35<32:48:11, 7.48s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7552, 'learning_rate': 9.377078384798101e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:37,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2052/17840 [3:28:42<31:56:31, 7.28s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2052/17840 [3:28:42<31:56:31, 7.28s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9854, 'learning_rate': 9.376484560570071e-05, 'epoch': 2.3} + 12%|████████▍ | 2052/17840 [3:28:42<31:56:31, 7.28s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2052/17840 [3:28:42<31:56:31, 7.28s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2052/17840 [3:28:42<31:56:31, 7.28s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2053/17840 [3:28:48<31:13:17, 7.12s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:49,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:49,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2054/17840 [3:28:55<30:40:58, 7.00s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2054/17840 [3:28:55<30:40:58, 7.00s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9509, 'learning_rate': 9.375296912114014e-05, 'epoch': 2.3} + 12%|████████▍ | 2054/17840 [3:28:55<30:40:58, 7.00s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:59,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:59,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.899, 'learning_rate': 9.374703087885986e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:59,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:59,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:59,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2056/17840 [3:29:09<30:13:24, 6.89s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:09,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:09,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2057/17840 [3:29:15<29:53:24, 6.82s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2057/17840 [3:29:15<29:53:24, 6.82s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6835, 'learning_rate': 9.373515439429929e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:17,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2058/17840 [3:29:22<29:39:07, 6.76s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2058/17840 [3:29:22<29:39:07, 6.76s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6567, 'learning_rate': 9.372921615201901e-05, 'epoch': 2.31} + 12%|████████▍ | 2058/17840 [3:29:22<29:39:07, 6.76s/it]g-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:25,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:25,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1262, 'learning_rate': 9.372327790973873e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:25,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9484, 'learning_rate': 9.371733966745844e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:13,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:29:41<28:49:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:40,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:29:41<28:49:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:40,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:29:41<28:49:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:40,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:29:48<28:29:38, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:29:48<28:29:38, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8441, 'learning_rate': 9.370546318289786e-05, 'epoch': 2.31} + 12%|████████▍ | 2062/17840 [3:29:48<28:29:38, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:29:54<28:09:49, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:29:54<28:09:49, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:54,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:54,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2064/17840 [3:30:00<27:58:41, 6.38s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2064/17840 [3:30:00<27:58:41, 6.38s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2986, 'learning_rate': 9.36935866983373e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:02,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:30:07<27:48:50, 6.35s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:30:07<27:48:50, 6.35s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8482, 'learning_rate': 9.368764845605701e-05, 'epoch': 2.32} +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:08,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:30:13<27:34:25, 6.29s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:30:13<27:34:25, 6.29s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5889, 'learning_rate': 9.368171021377673e-05, 'epoch': 2.32} +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:14,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:30:19<27:17:41, 6.23s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:30:19<27:17:41, 6.23s/it]g-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:19,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:19,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:10:46,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2068/17840 [3:30:25<26:47:40, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2068/17840 [3:30:25<26:47:40, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6293, 'learning_rate': 9.366983372921616e-05, 'epoch': 2.32} + 12%|████████▍ | 2068/17840 [3:30:25<26:47:40, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2069/17840 [3:30:30<26:18:53, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2069/17840 [3:30:30<26:18:53, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:30,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:30,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:30,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:23,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2070/17840 [3:30:36<25:59:00, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2070/17840 [3:30:36<25:59:00, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:39,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:39,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:41,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:41,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:30:47<25:07:10, 5.74s/it]g-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:30:47<25:07:10, 5.74s/it]g-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:47,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:49,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:49,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6832, 'learning_rate': 9.364014251781473e-05, 'epoch': 2.32} +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:53,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:35,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2074/17840 [3:30:58<23:48:00, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2074/17840 [3:30:58<23:48:00, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5938, 'learning_rate': 9.363420427553444e-05, 'epoch': 2.33} + 12%|████████▍ | 2074/17840 [3:30:58<23:48:00, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2075/17840 [3:31:05<25:54:36, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2075/17840 [3:31:05<25:54:36, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:04,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:04,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:56,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2076/17840 [3:31:09<24:16:18, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:07,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2076/17840 [3:31:09<24:16:18, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:07,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:10,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:07,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2077/17840 [3:31:14<22:41:48, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:12,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2077/17840 [3:31:14<22:41:48, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:12,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:14,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:12,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2078/17840 [3:31:18<21:10:55, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:16,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2078/17840 [3:31:18<21:10:55, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:16,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:17,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:16,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:17,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:16,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2079/17840 [3:31:21<19:27:09, 4.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:19,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2080/17840 [3:31:24<17:46:52, 4.06s/it]g-point operations will not be computed-17 20:12:19,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2080/17840 [3:31:24<17:46:52, 4.06s/it]g-point operations will not be computed-17 20:12:19,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:23,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:22,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:23,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:22,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2081/17840 [3:31:27<16:14:27, 3.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:25,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2081/17840 [3:31:27<16:14:27, 3.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:25,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2082/17840 [3:31:30<14:42:54, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2082/17840 [3:31:30<14:42:54, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2083/17840 [3:31:32<13:21:13, 3.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:30,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2083/17840 [3:31:32<13:21:13, 3.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:30,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2084/17840 [3:31:34<12:05:44, 2.76s/it]g-point operations will not be computed-17 20:12:30,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|���███████▌ | 2084/17840 [3:31:34<12:05:44, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2084/17840 [3:31:34<12:05:44, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:37,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:37,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2085/17840 [3:31:42<18:38:02, 4.26s/it]g-point operations will not be computed-17 20:12:33,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2085/17840 [3:31:42<18:38:02, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2085/17840 [3:31:42<18:38:02, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:45,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2086/17840 [3:31:49<22:55:43, 5.24s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2086/17840 [3:31:49<22:55:43, 5.24s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:50,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:50,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:50,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:57<25:52:20, 5.91s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:57<25:52:20, 5.91s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:57<25:52:20, 5.91s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:57<25:52:20, 5.91s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:57<25:52:20, 5.91s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2088/17840 [3:32:04<27:46:47, 6.35s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2088/17840 [3:32:04<27:46:47, 6.35s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2088/17840 [3:32:04<27:46:47, 6.35s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:09,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:09,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6044, 'learning_rate': 9.354513064133016e-05, 'epoch': 2.34} +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:09,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:09,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:09,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:32:19<29:59:31, 6.86s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:32:19<29:59:31, 6.86s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:32:19<29:59:31, 6.86s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:32:19<29:59:31, 6.86s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:32:19<29:59:31, 6.86s/it]g-point operations will not be computed-17 20:12:41,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:32:26<30:24:31, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:32:26<30:24:31, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:32:26<30:24:31, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:32:26<30:24:31, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:32:33<30:39:49, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:32:33<30:39:49, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:32:33<30:39:49, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:32:33<30:39:49, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:32:33<30:39:49, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2093/17840 [3:32:40<30:44:28, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:41,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:41,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:41,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:48<30:52:01, 7.06s/it]g-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:48<30:52:01, 7.06s/it]g-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:48<30:52:01, 7.06s/it]g-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:48<30:52:01, 7.06s/it]g-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:48<30:52:01, 7.06s/it]g-point operations will not be computed-17 20:13:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2095/17840 [3:32:55<30:48:48, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2095/17840 [3:32:55<30:48:48, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2095/17840 [3:32:55<30:48:48, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2095/17840 [3:32:55<30:48:48, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2096/17840 [3:33:02<30:41:08, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2096/17840 [3:33:02<30:41:08, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:04,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:33:08<30:30:10, 6.98s/it]g-point operations will not be computed-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:33:08<30:30:10, 6.98s/it]g-point operations will not be computed-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2464, 'learning_rate': 9.34976247030879e-05, 'epoch': 2.35} + 12%|████████▌ | 2097/17840 [3:33:08<30:30:10, 6.98s/it]g-point operations will not be computed-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:33:08<30:30:10, 6.98s/it]g-point operations will not be computed-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:33:08<30:30:10, 6.98s/it]g-point operations will not be computed-17 20:13:53,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:33:15<30:19:54, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:33:15<30:19:54, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:33:15<30:19:54, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:33:22<30:17:16, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:33:22<30:17:16, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.74, 'learning_rate': 9.348574821852733e-05, 'epoch': 2.35} + 12%|████████▌ | 2099/17840 [3:33:22<30:17:16, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:33:22<30:17:16, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:33:31<33:24:39, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:33:31<33:24:39, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9428, 'learning_rate': 9.347980997624703e-05, 'epoch': 2.35} + 12%|████████▌ | 2100/17840 [3:33:31<33:24:39, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:33:31<33:24:39, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:33:31<33:24:39, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2101/17840 [3:33:38<32:24:37, 7.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2101/17840 [3:33:38<32:24:37, 7.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:40,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2102/17840 [3:33:45<31:33:26, 7.22s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2102/17840 [3:33:45<31:33:26, 7.22s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8479, 'learning_rate': 9.346793349168646e-05, 'epoch': 2.36} + 12%|████████▌ | 2102/17840 [3:33:45<31:33:26, 7.22s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:49,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:49,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8615, 'learning_rate': 9.346199524940618e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:49,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:49,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:49,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2104/17840 [3:33:58<30:18:11, 6.93s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:59,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:59,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2105/17840 [3:34:05<29:55:40, 6.85s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2105/17840 [3:34:05<29:55:40, 6.85s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7793, 'learning_rate': 9.345011876484561e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:07,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2106/17840 [3:34:12<29:38:12, 6.78s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2106/17840 [3:34:12<29:38:12, 6.78s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8995, 'learning_rate': 9.344418052256533e-05, 'epoch': 2.36} + 12%|████████▌ | 2106/17840 [3:34:12<29:38:12, 6.78s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2106/17840 [3:34:12<29:38:12, 6.78s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2106/17840 [3:34:12<29:38:12, 6.78s/it]g-point operations will not be computed-17 20:14:14,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:34:18<29:29:35, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:34:18<29:29:35, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:34:18<29:29:35, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:34:25<29:10:14, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:34:25<29:10:14, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2109/17840 [3:34:31<28:44:58, 6.58s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2109/17840 [3:34:31<28:44:58, 6.58s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:31,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:31,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2110/17840 [3:34:38<28:35:14, 6.54s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2110/17840 [3:34:38<28:35:14, 6.54s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0071, 'learning_rate': 9.342042755344418e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:39,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2111/17840 [3:34:44<28:30:50, 6.53s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2111/17840 [3:34:44<28:30:50, 6.53s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8335, 'learning_rate': 9.34144893111639e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:46,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2112/17840 [3:34:50<28:12:51, 6.46s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2112/17840 [3:34:50<28:12:51, 6.46s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8886, 'learning_rate': 9.340855106888361e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:52,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2113/17840 [3:34:57<27:58:51, 6.41s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2113/17840 [3:34:57<27:58:51, 6.41s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8979, 'learning_rate': 9.340261282660333e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:58,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2114/17840 [3:35:03<27:49:54, 6.37s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2114/17840 [3:35:03<27:49:54, 6.37s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9612, 'learning_rate': 9.339667458432304e-05, 'epoch': 2.37} + 12%|████████▋ | 2114/17840 [3:35:03<27:49:54, 6.37s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:06,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:06,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8396, 'learning_rate': 9.339073634204276e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:06,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:12,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:12,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8095, 'learning_rate': 9.338479809976247e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:12,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:12,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:18,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:18,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:18,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:18,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:29,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:29,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2119/17840 [3:35:33<26:15:11, 6.01s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:33,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:33,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:33,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2120/17840 [3:35:39<25:50:17, 5.92s/it]g-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:39,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:39,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:39,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:17,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2121/17840 [3:35:44<25:27:03, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2121/17840 [3:35:44<25:27:03, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2121/17840 [3:35:44<25:27:03, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:47,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:47,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:51,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:51,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2123/17840 [3:35:55<24:28:20, 5.61s/it]g-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:55,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:57,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:57,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6052, 'learning_rate': 9.33372921615202e-05, 'epoch': 2.38} +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:01,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:01,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:43,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2125/17840 [3:36:07<25:55:43, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2125/17840 [3:36:07<25:55:43, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2125/17840 [3:36:07<25:55:43, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:09,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:11,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:11,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:13,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:15,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:15,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:17,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:19,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:19,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:21,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:24,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:24,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:25,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:25,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:27,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:27,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:29,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:32,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:32,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:34,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:34,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1162, 'learning_rate': 9.327790973871734e-05, 'epoch': 2.39} +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:38,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:38,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:42,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:42,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8473, 'learning_rate': 9.327197149643706e-05, 'epoch': 2.39} +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:46,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:46,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:46,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:49,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:49,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:49,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:49,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:49,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2137/17840 [3:37:00<25:52:07, 5.93s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:01,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:01,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:37:07<27:47:00, 6.37s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:37:07<27:47:00, 6.37s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8124, 'learning_rate': 9.32541567695962e-05, 'epoch': 2.4} + 12%|████████▋ | 2138/17840 [3:37:07<27:47:00, 6.37s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:37:07<27:47:00, 6.37s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:37:07<27:47:00, 6.37s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:37:15<29:03:04, 6.66s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:37:15<29:03:04, 6.66s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:37:15<29:03:04, 6.66s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:19,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:19,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8877, 'learning_rate': 9.324228028503563e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:19,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:19,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:37:29<30:18:14, 6.95s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:37:29<30:18:14, 6.95s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9763, 'learning_rate': 9.323634204275535e-05, 'epoch': 2.4} + 12%|████████▊ | 2141/17840 [3:37:29<30:18:14, 6.95s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:33,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:33,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3047, 'learning_rate': 9.323040380047506e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:33,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:33,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:37:43<30:49:54, 7.07s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:37:43<30:49:54, 7.07s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7642, 'learning_rate': 9.322446555819478e-05, 'epoch': 2.4} + 12%|████████▊ | 2143/17840 [3:37:43<30:49:54, 7.07s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:48,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:48,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9211, 'learning_rate': 9.32185273159145e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:48,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:48,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2145/17840 [3:37:58<30:50:41, 7.07s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2145/17840 [3:37:58<30:50:41, 7.07s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8282, 'learning_rate': 9.32125890736342e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:00,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2146/17840 [3:38:05<30:50:56, 7.08s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2146/17840 [3:38:05<30:50:56, 7.08s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9583, 'learning_rate': 9.320665083135393e-05, 'epoch': 2.41} + 12%|████████▊ | 2146/17840 [3:38:05<30:50:56, 7.08s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2146/17840 [3:38:05<30:50:56, 7.08s/it]g-point operations will not be computed-17 20:17:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2147/17840 [3:38:12<30:40:44, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2147/17840 [3:38:12<30:40:44, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1232, 'learning_rate': 9.320071258907363e-05, 'epoch': 2.41} + 12%|████████▊ | 2147/17840 [3:38:12<30:40:44, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:38:19<30:37:46, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:38:19<30:37:46, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8734, 'learning_rate': 9.319477434679335e-05, 'epoch': 2.41} + 12%|████████▊ | 2148/17840 [3:38:19<30:37:46, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:38:19<30:37:46, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2149/17840 [3:38:26<30:32:24, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2149/17840 [3:38:26<30:32:24, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:26,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:26,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2150/17840 [3:38:35<33:23:52, 7.66s/it]g-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2150/17840 [3:38:35<33:23:52, 7.66s/it]g-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8726, 'learning_rate': 9.318289786223278e-05, 'epoch': 2.41} + 12%|████████▊ | 2150/17840 [3:38:35<33:23:52, 7.66s/it]g-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2150/17840 [3:38:35<33:23:52, 7.66s/it]g-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:10,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2152/17840 [3:38:48<31:20:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2152/17840 [3:38:48<31:20:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0084, 'learning_rate': 9.317102137767222e-05, 'epoch': 2.41} + 12%|████████▊ | 2152/17840 [3:38:48<31:20:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2153/17840 [3:38:55<30:44:43, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2153/17840 [3:38:55<30:44:43, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8299, 'learning_rate': 9.316508313539193e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:57,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:57,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2154/17840 [3:39:02<30:17:55, 6.95s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2154/17840 [3:39:02<30:17:55, 6.95s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2154/17840 [3:39:02<30:17:55, 6.95s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:05,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:05,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1473, 'learning_rate': 9.315320665083136e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:09,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:09,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:09,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2156/17840 [3:39:15<29:41:16, 6.81s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:15,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:15,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:15,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:39:22<29:19:13, 6.73s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:39:22<29:19:13, 6.73s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:39:22<29:19:13, 6.73s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:39:22<29:19:13, 6.73s/it]g-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:25,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:25,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:25,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:32,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:32,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0934, 'learning_rate': 9.312945368171022e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:32,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:32,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:32,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:47,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:41<28:49:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:41<28:49:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:41<28:49:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:41<28:49:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2161/17840 [3:39:48<28:29:30, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:48,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:48,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:48,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2162/17840 [3:39:54<28:17:40, 6.50s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2162/17840 [3:39:54<28:17:40, 6.50s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:56,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:56,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2163/17840 [3:40:00<28:02:08, 6.44s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2163/17840 [3:40:00<28:02:08, 6.44s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:02,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:02,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2164/17840 [3:40:07<27:47:37, 6.38s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2164/17840 [3:40:07<27:47:37, 6.38s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:08,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:08,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2165/17840 [3:40:13<27:30:21, 6.32s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2165/17840 [3:40:13<27:30:21, 6.32s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:14,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:14,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2166/17840 [3:40:19<27:18:11, 6.27s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2166/17840 [3:40:19<27:18:11, 6.27s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:21,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:21,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2167/17840 [3:40:25<27:09:11, 6.24s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2167/17840 [3:40:25<27:09:11, 6.24s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:27,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:27,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2168/17840 [3:40:31<26:53:45, 6.18s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2168/17840 [3:40:31<26:53:45, 6.18s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:33,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:33,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2169/17840 [3:40:37<26:34:01, 6.10s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:37,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:37,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:37,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2170/17840 [3:40:43<26:15:21, 6.03s/it]g-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:43,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:43,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:43,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:40,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2171/17840 [3:40:49<25:51:59, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:47,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2171/17840 [3:40:49<25:51:59, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:47,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2171/17840 [3:40:49<25:51:59, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:47,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2171/17840 [3:40:49<25:51:59, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:47,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2172/17840 [3:40:54<25:22:13, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2172/17840 [3:40:54<25:22:13, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:57,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:57,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:59,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:59,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:59,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:53,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2174/17840 [3:41:05<24:23:36, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2174/17840 [3:41:05<24:23:36, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2174/17840 [3:41:05<24:23:36, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2175/17840 [3:41:12<26:30:15, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2175/17840 [3:41:12<26:30:15, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8166, 'learning_rate': 9.303444180522565e-05, 'epoch': 2.44} +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:13,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:13,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:03,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2176/17840 [3:41:17<24:50:27, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:15,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:17,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:15,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:17,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:15,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2177/17840 [3:41:22<23:13:02, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:22,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:22,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2178/17840 [3:41:26<21:39:16, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:24,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:26,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:24,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:26,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:24,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2179/17840 [3:41:29<20:02:26, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:27,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2180/17840 [3:41:33<18:21:03, 4.22s/it]g-point operations will not be computed-17 20:22:27,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2180/17840 [3:41:33<18:21:03, 4.22s/it]g-point operations will not be computed-17 20:22:27,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:32,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:31,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:32,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:31,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2181/17840 [3:41:36<16:34:09, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:33,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2182/17840 [3:41:38<14:54:29, 3.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:36,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2182/17840 [3:41:38<14:54:29, 3.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:36,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2183/17840 [3:41:41<13:31:11, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:38,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2183/17840 [3:41:41<13:31:11, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:38,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:43<12:16:24, 2.82s/it]g-point operations will not be computed-17 20:22:38,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:43<12:16:24, 2.82s/it]g-point operations will not be computed-17 20:22:38,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:43<12:16:24, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:43<12:16:24, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:46,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:51<18:45:33, 4.31s/it]g-point operations will not be computed-17 20:22:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:51<18:45:33, 4.31s/it]g-point operations will not be computed-17 20:22:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:51<18:45:33, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:51<18:45:33, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:53,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:41:58<22:51:50, 5.26s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:41:58<22:51:50, 5.26s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7707, 'learning_rate': 9.29750593824228e-05, 'epoch': 2.45} + 12%|████████▉ | 2186/17840 [3:41:58<22:51:50, 5.26s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:02,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:02,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.179, 'learning_rate': 9.296912114014252e-05, 'epoch': 2.45} +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:02,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:02,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:42:13<27:34:07, 6.34s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:42:13<27:34:07, 6.34s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9481, 'learning_rate': 9.296318289786223e-05, 'epoch': 2.45} + 12%|████████▉ | 2188/17840 [3:42:13<27:34:07, 6.34s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:42:13<27:34:07, 6.34s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:42:13<27:34:07, 6.34s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2189/17840 [3:42:20<28:47:54, 6.62s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:21,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:21,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:42:27<29:39:22, 6.82s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:42:27<29:39:22, 6.82s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7497, 'learning_rate': 9.295130641330166e-05, 'epoch': 2.46} + 12%|████████▉ | 2190/17840 [3:42:27<29:39:22, 6.82s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:42:27<29:39:22, 6.82s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:42:34<30:02:20, 6.91s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:42:34<30:02:20, 6.91s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0459, 'learning_rate': 9.294536817102139e-05, 'epoch': 2.46} +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:37,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:42<30:22:32, 6.99s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:42<30:22:32, 6.99s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2171, 'learning_rate': 9.29394299287411e-05, 'epoch': 2.46} + 12%|████████▉ | 2192/17840 [3:42:42<30:22:32, 6.99s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:42<30:22:32, 6.99s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2193/17840 [3:42:49<30:38:37, 7.05s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2193/17840 [3:42:49<30:38:37, 7.05s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0718, 'learning_rate': 9.293349168646082e-05, 'epoch': 2.46} +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:51,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:56<30:45:51, 7.08s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:56<30:45:51, 7.08s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2459, 'learning_rate': 9.292755344418053e-05, 'epoch': 2.46} + 12%|████████▉ | 2194/17840 [3:42:56<30:45:51, 7.08s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:56<30:45:51, 7.08s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2195/17840 [3:43:03<30:40:14, 7.06s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2195/17840 [3:43:03<30:40:14, 7.06s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:03,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:03,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2196/17840 [3:43:10<30:35:04, 7.04s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2196/17840 [3:43:10<30:35:04, 7.04s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8646, 'learning_rate': 9.291567695961995e-05, 'epoch': 2.46} + 12%|████████▉ | 2196/17840 [3:43:10<30:35:04, 7.04s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:14,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:14,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7569, 'learning_rate': 9.290973871733967e-05, 'epoch': 2.46} +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:14,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:14,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2198/17840 [3:43:24<30:31:56, 7.03s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2198/17840 [3:43:24<30:31:56, 7.03s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6674, 'learning_rate': 9.29038004750594e-05, 'epoch': 2.46} + 12%|████████▉ | 2198/17840 [3:43:24<30:31:56, 7.03s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:28,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:28,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7829, 'learning_rate': 9.28978622327791e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:28,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:28,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:43:40<33:17:11, 7.66s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:43:40<33:17:11, 7.66s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0128, 'learning_rate': 9.289192399049882e-05, 'epoch': 2.47} + 12%|█████████ | 2200/17840 [3:43:40<33:17:11, 7.66s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:44,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:44,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8649, 'learning_rate': 9.288598574821853e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:44,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:44,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:43:54<31:34:05, 7.27s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:43:54<31:34:05, 7.27s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:44:01<31:03:53, 7.15s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:44:01<31:03:53, 7.15s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7208, 'learning_rate': 9.287410926365795e-05, 'epoch': 2.47} + 12%|█████████ | 2203/17840 [3:44:01<31:03:53, 7.15s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:44:01<31:03:53, 7.15s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:05,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:05,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:05,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:05,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:05,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2205/17840 [3:44:14<30:19:46, 6.98s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:15,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:15,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:15,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2206/17840 [3:44:21<29:59:41, 6.91s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2206/17840 [3:44:21<29:59:41, 6.91s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2206/17840 [3:44:21<29:59:41, 6.91s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:25,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:25,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6035, 'learning_rate': 9.285035629453682e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:25,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:31,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:31,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8826, 'learning_rate': 9.284441805225653e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:31,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:31,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:31,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2209/17840 [3:44:41<29:08:12, 6.71s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:41,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:41,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:41,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2210/17840 [3:44:47<28:49:46, 6.64s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2210/17840 [3:44:47<28:49:46, 6.64s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:49,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:49,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2211/17840 [3:44:54<28:32:23, 6.57s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2211/17840 [3:44:54<28:32:23, 6.57s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2211/17840 [3:44:54<28:32:23, 6.57s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2211/17840 [3:44:54<28:32:23, 6.57s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:57,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:57,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:57,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:04,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:04,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7127, 'learning_rate': 9.281472684085512e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:04,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:10,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:10,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7662, 'learning_rate': 9.280878859857482e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:15,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2215/17840 [3:45:19<27:33:57, 6.35s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2215/17840 [3:45:19<27:33:57, 6.35s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0376, 'learning_rate': 9.280285035629455e-05, 'epoch': 2.48} + 12%|█████████ | 2215/17840 [3:45:19<27:33:57, 6.35s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:22,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:22,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.599, 'learning_rate': 9.279691211401425e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:22,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:28,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:28,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6691, 'learning_rate': 9.279097387173397e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:28,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:34,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:34,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6513, 'learning_rate': 9.278503562945369e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:38,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:38,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2219/17840 [3:45:43<25:55:43, 5.98s/it]g-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:43,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:43,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:43,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:49,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2220/17840 [3:45:49<25:32:24, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2220/17840 [3:45:49<25:32:24, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:51,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:51,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7744, 'learning_rate': 9.276722090261283e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:55,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:55,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2222/17840 [3:45:59<24:26:36, 5.63s/it]g-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:59,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:59,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:59,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2223/17840 [3:46:05<23:52:59, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2223/17840 [3:46:05<23:52:59, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2223/17840 [3:46:05<23:52:59, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:06,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:09,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:09,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2225/17840 [3:46:16<24:51:05, 5.73s/it]g-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2225/17840 [3:46:16<24:51:05, 5.73s/it]g-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:15,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:17,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:17,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8628, 'learning_rate': 9.273752969121141e-05, 'epoch': 2.5} + 12%|█████████ | 2227/17840 [3:46:24<21:12:58, 4.89s/it]g-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2227/17840 [3:46:24<21:12:58, 4.89s/it]g-point operations will not be computed-17 20:27:03,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2227/17840 [3:46:24<21:12:58, 4.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:22,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2228/17840 [3:46:28<19:40:11, 4.54s/it]g-point operations will not be computed-17 20:27:22,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2228/17840 [3:46:28<19:40:11, 4.54s/it]g-point operations will not be computed-17 20:27:22,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2228/17840 [3:46:28<19:40:11, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:26,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2228/17840 [3:46:28<19:40:11, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:26,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2229/17840 [3:46:31<18:09:46, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 2230/17840 [3:46:35<16:43:15, 3.86s/it]g-point operations will not be computed-17 20:27:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 2230/17840 [3:46:35<16:43:15, 3.86s/it]g-point operations will not be computed-17 20:27:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 2230/17840 [3:46:35<16:43:15, 3.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:32,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 2230/17840 [3:46:35<16:43:15, 3.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:32,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2231/17840 [3:46:37<15:24:24, 3.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:35,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2232/17840 [3:46:40<14:10:44, 3.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:38,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2232/17840 [3:46:40<14:10:44, 3.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:38,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2233/17840 [3:46:42<13:03:43, 3.01s/it]g-point operations will not be computed-17 20:27:38,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2233/17840 [3:46:42<13:03:43, 3.01s/it]g-point operations will not be computed-17 20:27:38,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:46:45<11:55:30, 2.75s/it]g-point operations will not be computed-17 20:27:40,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:46:45<11:55:30, 2.75s/it]g-point operations will not be computed-17 20:27:40,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:46:45<11:55:30, 2.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:44,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:46:45<11:55:30, 2.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:44,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:47,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:44,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:46:52<18:38:47, 4.30s/it]g-point operations will not be computed-17 20:27:44,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:46:52<18:38:47, 4.30s/it]g-point operations will not be computed-17 20:27:44,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:46:52<18:38:47, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:51,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:46:52<18:38:47, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:51,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:55,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:51,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:55,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:51,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:47:00<22:50:33, 5.27s/it]g-point operations will not be computed-17 20:27:51,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:47:00<22:50:33, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:47:00<22:50:33, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:47:00<22:50:33, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:47:00<22:50:33, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:47:08<25:45:28, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:47:08<25:45:28, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:10,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:47:15<27:36:30, 6.37s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:47:15<27:36:30, 6.37s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.096, 'learning_rate': 9.266627078384799e-05, 'epoch': 2.51} + 13%|█████████▏ | 2238/17840 [3:47:15<27:36:30, 6.37s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:47:15<27:36:30, 6.37s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:47:15<27:36:30, 6.37s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2239/17840 [3:47:22<28:50:39, 6.66s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2239/17840 [3:47:22<28:50:39, 6.66s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:25,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:47:29<29:37:52, 6.84s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:47:29<29:37:52, 6.84s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8373, 'learning_rate': 9.265439429928742e-05, 'epoch': 2.51} + 13%|█████████▏ | 2240/17840 [3:47:29<29:37:52, 6.84s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:47:29<29:37:52, 6.84s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2241/17840 [3:47:37<30:04:05, 6.94s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2241/17840 [3:47:37<30:04:05, 6.94s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0546, 'learning_rate': 9.264845605700713e-05, 'epoch': 2.51} + 13%|█████████▏ | 2241/17840 [3:47:37<30:04:05, 6.94s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:41,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:41,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7821, 'learning_rate': 9.264251781472685e-05, 'epoch': 2.51} +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:41,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:41,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2243/17840 [3:47:51<30:36:49, 7.07s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2243/17840 [3:47:51<30:36:49, 7.07s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9268, 'learning_rate': 9.263657957244655e-05, 'epoch': 2.51} + 13%|█████████▏ | 2243/17840 [3:47:51<30:36:49, 7.07s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:55,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:55,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9843, 'learning_rate': 9.263064133016627e-05, 'epoch': 2.52} +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:55,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:55,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2245/17840 [3:48:05<30:44:23, 7.10s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2245/17840 [3:48:05<30:44:23, 7.10s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1607, 'learning_rate': 9.262470308788599e-05, 'epoch': 2.52} + 13%|█████████▏ | 2245/17840 [3:48:05<30:44:23, 7.10s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:09,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:09,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8274, 'learning_rate': 9.261876484560571e-05, 'epoch': 2.52} +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:09,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:09,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2247/17840 [3:48:19<30:33:12, 7.05s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2247/17840 [3:48:19<30:33:12, 7.05s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9047, 'learning_rate': 9.261282660332542e-05, 'epoch': 2.52} +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:22,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:48:26<30:33:15, 7.05s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:48:26<30:33:15, 7.05s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7965, 'learning_rate': 9.260688836104513e-05, 'epoch': 2.52} + 13%|█████████▏ | 2248/17840 [3:48:26<30:33:15, 7.05s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:48:26<30:33:15, 7.05s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2249/17840 [3:48:33<30:24:26, 7.02s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2249/17840 [3:48:33<30:24:26, 7.02s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:34,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:34,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:48:43<33:22:52, 7.71s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:48:43<33:22:52, 7.71s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.621, 'learning_rate': 9.259501187648455e-05, 'epoch': 2.52} + 13%|█████████▏ | 2250/17840 [3:48:43<33:22:52, 7.71s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:48:43<33:22:52, 7.71s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:48:50<32:37:27, 7.53s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:48:50<32:37:27, 7.53s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:50,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:50,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2252/17840 [3:48:57<31:48:51, 7.35s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2252/17840 [3:48:57<31:48:51, 7.35s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8368, 'learning_rate': 9.2583135391924e-05, 'epoch': 2.52} + 13%|█████████▏ | 2252/17840 [3:48:57<31:48:51, 7.35s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2252/17840 [3:48:57<31:48:51, 7.35s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:00,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2254/17840 [3:49:10<30:40:51, 7.09s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:11,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:11,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:11,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2255/17840 [3:49:17<30:15:34, 6.99s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2255/17840 [3:49:17<30:15:34, 6.99s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:19,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:19,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:49:24<29:50:30, 6.89s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:49:24<29:50:30, 6.89s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:49:24<29:50:30, 6.89s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:49:24<29:50:30, 6.89s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:49:24<29:50:30, 6.89s/it]g-point operations will not be computed-17 20:27:59,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2257/17840 [3:49:30<29:30:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2257/17840 [3:49:30<29:30:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2257/17840 [3:49:30<29:30:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2257/17840 [3:49:30<29:30:08, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2258/17840 [3:49:37<29:11:52, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:37,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:37,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:37,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2259/17840 [3:49:43<28:43:26, 6.64s/it]g-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:43,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:43,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:43,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2260/17840 [3:49:50<28:21:57, 6.55s/it]g-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2260/17840 [3:49:50<28:21:57, 6.55s/it]g-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:51,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2261/17840 [3:49:56<28:11:36, 6.51s/it]g-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2261/17840 [3:49:56<28:11:36, 6.51s/it]g-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7043, 'learning_rate': 9.252969121140142e-05, 'epoch': 2.53} + 13%|█████████▎ | 2261/17840 [3:49:56<28:11:36, 6.51s/it]g-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:59,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:59,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8931, 'learning_rate': 9.252375296912114e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:59,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:59,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:59,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:30:29,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2263/17840 [3:50:09<27:56:06, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:07,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2263/17840 [3:50:09<27:56:06, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:07,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2263/17840 [3:50:09<27:56:06, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:07,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2263/17840 [3:50:09<27:56:06, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:07,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2264/17840 [3:50:15<27:33:35, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:14,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2264/17840 [3:50:15<27:33:35, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:14,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2264/17840 [3:50:15<27:33:35, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:14,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2264/17840 [3:50:15<27:33:35, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:14,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2265/17840 [3:50:21<27:14:40, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:20,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2265/17840 [3:50:21<27:14:40, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:20,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2265/17840 [3:50:21<27:14:40, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:20,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2265/17840 [3:50:21<27:14:40, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:20,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2266/17840 [3:50:27<26:55:32, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2266/17840 [3:50:27<26:55:32, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:30,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:30,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9074, 'learning_rate': 9.249406175771972e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:30,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:36,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:36,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8172, 'learning_rate': 9.248812351543944e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:40,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2269/17840 [3:50:45<25:58:47, 6.01s/it]g-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2269/17840 [3:50:45<25:58:47, 6.01s/it]g-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9364, 'learning_rate': 9.248218527315915e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:46,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:46,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2270/17840 [3:50:51<25:35:00, 5.92s/it]g-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:50,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:50,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:50,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:50:56<25:13:30, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:55,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:50:56<25:13:30, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:55,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:50:56<25:13:30, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:55,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:50:56<25:13:30, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:55,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2272/17840 [3:51:02<24:59:02, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:00,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2272/17840 [3:51:02<24:59:02, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:00,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:04,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:00,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:04,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:00,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8409, 'learning_rate': 9.245843230403801e-05, 'epoch': 2.55} +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:08,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:00,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:08,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:00,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2274/17840 [3:51:12<23:45:20, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2274/17840 [3:51:12<23:45:20, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2274/17840 [3:51:12<23:45:20, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2275/17840 [3:51:19<25:37:08, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2275/17840 [3:51:19<25:37:08, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:19,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:21,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:21,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:23,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:23,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:23,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:11,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2277/17840 [3:51:28<22:19:16, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:26,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:28,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:26,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:28,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:26,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2278/17840 [3:51:32<20:40:51, 4.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:30,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2279/17840 [3:51:36<19:04:21, 4.41s/it]g-point operations will not be computed-17 20:32:30,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2279/17840 [3:51:36<19:04:21, 4.41s/it]g-point operations will not be computed-17 20:32:30,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:34,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:34,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2280/17840 [3:51:39<17:38:10, 4.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2281/17840 [3:51:42<16:12:59, 3.75s/it]g-point operations will not be computed-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2281/17840 [3:51:42<16:12:59, 3.75s/it]g-point operations will not be computed-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:41,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:40,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:41,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:40,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:42,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:42,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2283/17840 [3:51:47<13:35:33, 3.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:45,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2283/17840 [3:51:47<13:35:33, 3.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:45,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2284/17840 [3:51:49<12:17:56, 2.85s/it]g-point operations will not be computed-17 20:32:45,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2284/17840 [3:51:49<12:17:56, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:48,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2284/17840 [3:51:49<12:17:56, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:48,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:52,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:48,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:52,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:48,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2285/17840 [3:51:57<18:44:29, 4.34s/it]g-point operations will not be computed-17 20:32:48,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2285/17840 [3:51:57<18:44:29, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:56,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2285/17840 [3:51:57<18:44:29, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:56,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:52:05<22:53:56, 5.30s/it]g-point operations will not be computed-17 20:32:56,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:52:05<22:53:56, 5.30s/it]g-point operations will not be computed-17 20:32:56,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:52:05<22:53:56, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:52:05<22:53:56, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:52:05<22:53:56, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:52:12<25:44:22, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:52:12<25:44:22, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.795, 'learning_rate': 9.237529691211402e-05, 'epoch': 2.56} + 13%|█████████▎ | 2287/17840 [3:52:12<25:44:22, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:52:12<25:44:22, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:52:12<25:44:22, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2288/17840 [3:52:20<27:35:11, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:20,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:20,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:52:27<28:50:31, 6.68s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:52:27<28:50:31, 6.68s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6531, 'learning_rate': 9.236342042755344e-05, 'epoch': 2.57} + 13%|█████████▎ | 2289/17840 [3:52:27<28:50:31, 6.68s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:52:27<28:50:31, 6.68s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:52:34<29:34:56, 6.85s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:52:34<29:34:56, 6.85s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:35,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:35,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:52:42<30:08:29, 6.98s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:52:42<30:08:29, 6.98s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8311, 'learning_rate': 9.235154394299289e-05, 'epoch': 2.57} + 13%|█████████▎ | 2291/17840 [3:52:42<30:08:29, 6.98s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:52:42<30:08:29, 6.98s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2292/17840 [3:52:49<30:22:11, 7.03s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2292/17840 [3:52:49<30:22:11, 7.03s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:49,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:49,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:52:56<30:32:08, 7.07s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:52:56<30:32:08, 7.07s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0941, 'learning_rate': 9.233966745843231e-05, 'epoch': 2.57} + 13%|█████████▍ | 2293/17840 [3:52:56<30:32:08, 7.07s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:52:56<30:32:08, 7.07s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:52:56<30:32:08, 7.07s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2294/17840 [3:53:03<30:36:45, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2294/17840 [3:53:03<30:36:45, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:05,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:05,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2295/17840 [3:53:10<30:36:15, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2295/17840 [3:53:10<30:36:15, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2295/17840 [3:53:10<30:36:15, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2295/17840 [3:53:10<30:36:15, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2295/17840 [3:53:10<30:36:15, 7.09s/it]g-point operations will not be computed-17 20:33:04,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:53:17<30:27:32, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:53:17<30:27:32, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:53:17<30:27:32, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:53:17<30:27:32, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:53:24<30:26:04, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|███████��█▍ | 2297/17840 [3:53:24<30:26:04, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:53:24<30:26:04, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:53:24<30:26:04, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:53:24<30:26:04, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2298/17840 [3:53:31<30:26:22, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2298/17840 [3:53:31<30:26:22, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2298/17840 [3:53:31<30:26:22, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2298/17840 [3:53:31<30:26:22, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:53:38<30:21:54, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:53:38<30:21:54, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:40,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:48<33:20:49, 7.73s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:48<33:20:49, 7.73s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7317, 'learning_rate': 9.229809976247031e-05, 'epoch': 2.58} + 13%|█████████▍ | 2300/17840 [3:53:48<33:20:49, 7.73s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:48<33:20:49, 7.73s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:48<33:20:49, 7.73s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2301/17840 [3:53:54<32:24:16, 7.51s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:55,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:55,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:54:01<31:28:08, 7.29s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:54:01<31:28:08, 7.29s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.747, 'learning_rate': 9.228622327790974e-05, 'epoch': 2.58} + 13%|█████████▍ | 2302/17840 [3:54:01<31:28:08, 7.29s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:54:01<31:28:08, 7.29s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:54:01<31:28:08, 7.29s/it]g-point operations will not be computed-17 20:34:30,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2303/17840 [3:54:08<30:52:04, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2303/17840 [3:54:08<30:52:04, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2303/17840 [3:54:08<30:52:04, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2303/17840 [3:54:08<30:52:04, 7.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2304/17840 [3:54:15<30:23:33, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2304/17840 [3:54:15<30:23:33, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:17,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:54:22<29:59:47, 6.95s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:54:22<29:59:47, 6.95s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9437, 'learning_rate': 9.226840855106889e-05, 'epoch': 2.58} + 13%|█████████▍ | 2305/17840 [3:54:22<29:59:47, 6.95s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:25,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:25,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6339, 'learning_rate': 9.226247030878861e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:25,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:25,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:25,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2307/17840 [3:54:35<29:22:42, 6.81s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:35,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:35,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2308/17840 [3:54:42<29:15:41, 6.78s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2308/17840 [3:54:42<29:15:41, 6.78s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9309, 'learning_rate': 9.225059382422804e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:44,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:54:48<28:59:30, 6.72s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:54:48<28:59:30, 6.72s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7875, 'learning_rate': 9.224465558194774e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:50,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2310/17840 [3:54:55<28:40:28, 6.65s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2310/17840 [3:54:55<28:40:28, 6.65s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7954, 'learning_rate': 9.223871733966746e-05, 'epoch': 2.59} + 13%|█████████▍ | 2310/17840 [3:54:55<28:40:28, 6.65s/it]g-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:58,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:58,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6163, 'learning_rate': 9.223277909738718e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:58,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:58,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:58,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:35:07,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2312/17840 [3:55:08<28:14:08, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2312/17840 [3:55:08<28:14:08, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2312/17840 [3:55:08<28:14:08, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2312/17840 [3:55:08<28:14:08, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2313/17840 [3:55:14<28:01:27, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:14,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:14,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2314/17840 [3:55:20<27:52:23, 6.46s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2314/17840 [3:55:20<27:52:23, 6.46s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7297, 'learning_rate': 9.221496437054632e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:22,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2315/17840 [3:55:27<27:41:12, 6.42s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2315/17840 [3:55:27<27:41:12, 6.42s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9698, 'learning_rate': 9.220902612826604e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:28,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2316/17840 [3:55:33<27:29:10, 6.37s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2316/17840 [3:55:33<27:29:10, 6.37s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5971, 'learning_rate': 9.220308788598575e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:35,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2317/17840 [3:55:39<27:14:39, 6.32s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2317/17840 [3:55:39<27:14:39, 6.32s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6569, 'learning_rate': 9.219714964370547e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:41,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2318/17840 [3:55:45<26:57:12, 6.25s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2318/17840 [3:55:45<26:57:12, 6.25s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.673, 'learning_rate': 9.219121140142519e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:47,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2319/17840 [3:55:51<26:35:18, 6.17s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2319/17840 [3:55:51<26:35:18, 6.17s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2953, 'learning_rate': 9.21852731591449e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:53,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2320/17840 [3:55:57<26:13:37, 6.08s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2320/17840 [3:55:57<26:13:37, 6.08s/it]g-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:57,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:57,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:06,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2321/17840 [3:56:03<25:48:48, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2321/17840 [3:56:03<25:48:48, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0074, 'learning_rate': 9.217339667458432e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:05,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:05,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9504, 'learning_rate': 9.216745843230404e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:10,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2323/17840 [3:56:14<24:50:07, 5.76s/it]g-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2323/17840 [3:56:14<24:50:07, 5.76s/it]g-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:14,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:14,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:01,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2324/17840 [3:56:19<24:09:38, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2324/17840 [3:56:19<24:09:38, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7833, 'learning_rate': 9.215558194774348e-05, 'epoch': 2.61} + 13%|█████████▌ | 2324/17840 [3:56:19<24:09:38, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2325/17840 [3:56:27<26:14:34, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2325/17840 [3:56:27<26:14:34, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:26,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:28,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:28,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:28,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:31,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2327/17840 [3:56:36<22:50:04, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:34,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2327/17840 [3:56:36<22:50:04, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:34,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:36,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:34,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2328/17840 [3:56:40<21:18:08, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:38,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2328/17840 [3:56:40<21:18:08, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:38,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:40,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:38,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2329/17840 [3:56:43<19:44:40, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:41,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2329/17840 [3:56:43<19:44:40, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:41,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2330/17840 [3:56:47<18:10:14, 4.22s/it]g-point operations will not be computed-17 20:37:41,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2330/17840 [3:56:47<18:10:14, 4.22s/it]g-point operations will not be computed-17 20:37:41,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2330/17840 [3:56:47<18:10:14, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:45,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2331/17840 [3:56:50<16:39:40, 3.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2331/17840 [3:56:50<16:39:40, 3.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2332/17840 [3:56:53<15:07:50, 3.51s/it]g-point operations will not be computed-17 20:37:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2332/17840 [3:56:53<15:07:50, 3.51s/it]g-point operations will not be computed-17 20:37:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2333/17840 [3:56:55<13:43:48, 3.19s/it]g-point operations will not be computed-17 20:37:50,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2333/17840 [3:56:55<13:43:48, 3.19s/it]g-point operations will not be computed-17 20:37:50,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9659, 'learning_rate': 9.210213776722091e-05, 'epoch': 2.62} + g-point operations will not be computed-17 20:37:53,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2334/17840 [3:56:57<12:19:27, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:56,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2334/17840 [3:56:57<12:19:27, 2.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:56,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:00,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:56,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:00,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:56,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:57:05<18:52:58, 4.38s/it]g-point operations will not be computed-17 20:37:56,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:57:05<18:52:58, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:57:05<18:52:58, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:08,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:08,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:57:13<22:59:52, 5.34s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:57:13<22:59:52, 5.34s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:57:13<22:59:52, 5.34s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:57:13<22:59:52, 5.34s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:57:13<22:59:52, 5.34s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:57:20<25:48:12, 5.99s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:57:20<25:48:12, 5.99s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:57:20<25:48:12, 5.99s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:57:20<25:48:12, 5.99s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:24,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:24,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:24,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:24,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:24,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:57:35<28:55:05, 6.72s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:57:35<28:55:05, 6.72s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:57:35<28:55:05, 6.72s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:57:35<28:55:05, 6.72s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:57:35<28:55:05, 6.72s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2340/17840 [3:57:42<29:46:42, 6.92s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:43,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:43,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:43,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:57:50<30:12:28, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:57:50<30:12:28, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:57:50<30:12:28, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:57:50<30:12:28, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:57:50<30:12:28, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2342/17840 [3:57:57<30:32:07, 7.09s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:57,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:57,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:01,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:01,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:01,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:01,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:01,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:58:11<30:58:51, 7.20s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:58:11<30:58:51, 7.20s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:58:11<30:58:51, 7.20s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:15,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:15,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7478, 'learning_rate': 9.203087885985749e-05, 'epoch': 2.63} +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:15,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:15,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:15,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:58:26<30:48:33, 7.16s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:58:26<30:48:33, 7.16s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:58:26<30:48:33, 7.16s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:30,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:30,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9517, 'learning_rate': 9.201900237529691e-05, 'epoch': 2.63} +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:30,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:30,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:30,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2348/17840 [3:58:40<30:22:01, 7.06s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2348/17840 [3:58:40<30:22:01, 7.06s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:42,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:42,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2349/17840 [3:58:47<30:12:06, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2349/17840 [3:58:47<30:12:06, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2349/17840 [3:58:47<30:12:06, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2349/17840 [3:58:47<30:12:06, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2349/17840 [3:58:47<30:12:06, 7.02s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2350/17840 [3:58:56<33:15:47, 7.73s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:56,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:56,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2351/17840 [3:59:03<32:15:30, 7.50s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2351/17840 [3:59:03<32:15:30, 7.50s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.775, 'learning_rate': 9.199524940617578e-05, 'epoch': 2.64} + 13%|█████████▌ | 2351/17840 [3:59:03<32:15:30, 7.50s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2351/17840 [3:59:03<32:15:30, 7.50s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2351/17840 [3:59:03<32:15:30, 7.50s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:59:10<31:27:04, 7.31s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:10,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:10,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:10,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2353/17840 [3:59:17<30:47:08, 7.16s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2353/17840 [3:59:17<30:47:08, 7.16s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2353/17840 [3:59:17<30:47:08, 7.16s/it]g-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:20,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:20,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8272, 'learning_rate': 9.197743467933492e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:20,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:20,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:20,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:04,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:59:30<29:53:16, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:59:30<29:53:16, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:59:30<29:53:16, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:59:30<29:53:16, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2356/17840 [3:59:37<29:32:36, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2356/17840 [3:59:37<29:32:36, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:39,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:43<29:13:30, 6.80s/it]g-point operations will not be computed-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:43<29:13:30, 6.80s/it]g-point operations will not be computed-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7087, 'learning_rate': 9.195961995249406e-05, 'epoch': 2.64} + 13%|█████████▋ | 2357/17840 [3:59:43<29:13:30, 6.80s/it]g-point operations will not be computed-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:43<29:13:30, 6.80s/it]g-point operations will not be computed-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:43<29:13:30, 6.80s/it]g-point operations will not be computed-17 20:40:29,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2358/17840 [3:59:50<29:03:39, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:49,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2358/17840 [3:59:50<29:03:39, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:49,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2358/17840 [3:59:50<29:03:39, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:49,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2358/17840 [3:59:50<29:03:39, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:49,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2359/17840 [3:59:57<28:43:31, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2359/17840 [3:59:57<28:43:31, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2359/17840 [3:59:57<28:43:31, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2359/17840 [3:59:57<28:43:31, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2360/17840 [4:00:03<28:22:34, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:03,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:03,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:03,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2361/17840 [4:00:09<28:08:20, 6.54s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:10,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:10,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2362/17840 [4:00:16<27:54:33, 6.49s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2362/17840 [4:00:16<27:54:33, 6.49s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7611, 'learning_rate': 9.192992874109264e-05, 'epoch': 2.65} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:17,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2363/17840 [4:00:22<27:43:05, 6.45s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2363/17840 [4:00:22<27:43:05, 6.45s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9004, 'learning_rate': 9.192399049881234e-05, 'epoch': 2.65} + 13%|█████████▋ | 2363/17840 [4:00:22<27:43:05, 6.45s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:25,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:25,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8853, 'learning_rate': 9.191805225653208e-05, 'epoch': 2.65} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:25,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:32,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:32,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.664, 'learning_rate': 9.191211401425179e-05, 'epoch': 2.65} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:32,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:38,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:38,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8319, 'learning_rate': 9.19061757719715e-05, 'epoch': 2.65} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:38,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:44,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:44,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7399, 'learning_rate': 9.190023752969121e-05, 'epoch': 2.65} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:48,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2368/17840 [4:00:53<26:23:02, 6.14s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2368/17840 [4:00:53<26:23:02, 6.14s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8979, 'learning_rate': 9.189429928741093e-05, 'epoch': 2.65} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:54,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2369/17840 [4:00:59<26:10:11, 6.09s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2369/17840 [4:00:59<26:10:11, 6.09s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7376, 'learning_rate': 9.188836104513064e-05, 'epoch': 2.66} +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:00,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2370/17840 [4:01:05<25:44:03, 5.99s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2370/17840 [4:01:05<25:44:03, 5.99s/it]g-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:05,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:05,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:55,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2371/17840 [4:01:10<25:17:26, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2371/17840 [4:01:10<25:17:26, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.781, 'learning_rate': 9.187648456057008e-05, 'epoch': 2.66} +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:13,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:13,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7693, 'learning_rate': 9.187054631828979e-05, 'epoch': 2.66} +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:17,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2373/17840 [4:01:21<24:11:59, 5.63s/it]g-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2373/17840 [4:01:21<24:11:59, 5.63s/it]g-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:21,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:21,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:21,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2374/17840 [4:01:26<23:34:04, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:27,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2375/17840 [4:01:33<25:19:32, 5.90s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2375/17840 [4:01:33<25:19:32, 5.90s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:33,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:35,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:35,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:37,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:39,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:39,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:41,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:43,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:43,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:45,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:47,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:47,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:48,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:50,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:50,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:53,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:53,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:54,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:57,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:57,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:59,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:59,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:00,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:00,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.3808, 'learning_rate': 9.179928741092638e-05, 'epoch': 2.67} +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:04,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:04,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:08,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:08,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1807, 'learning_rate': 9.179334916864608e-05, 'epoch': 2.67} +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:12,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:15,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:15,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9304, 'learning_rate': 9.17874109263658e-05, 'epoch': 2.67} +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:15,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:15,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2387/17840 [4:02:26<25:22:53, 5.91s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2387/17840 [4:02:26<25:22:53, 5.91s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8673, 'learning_rate': 9.178147268408551e-05, 'epoch': 2.68} + 13%|█████████▊ | 2387/17840 [4:02:26<25:22:53, 5.91s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2387/17840 [4:02:26<25:22:53, 5.91s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [4:02:33<27:06:15, 6.31s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [4:02:33<27:06:15, 6.31s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9106, 'learning_rate': 9.177553444180523e-05, 'epoch': 2.68} + 13%|█████████▊ | 2388/17840 [4:02:33<27:06:15, 6.31s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:37,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:37,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7837, 'learning_rate': 9.176959619952494e-05, 'epoch': 2.68} +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:37,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:37,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:48<29:14:35, 6.81s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:48<29:14:35, 6.81s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.88, 'learning_rate': 9.176365795724466e-05, 'epoch': 2.68} + 13%|█████████▊ | 2390/17840 [4:02:48<29:14:35, 6.81s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:52,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:52,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7558, 'learning_rate': 9.175771971496438e-05, 'epoch': 2.68} +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:52,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:52,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2392/17840 [4:03:02<30:06:19, 7.02s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2392/17840 [4:03:02<30:06:19, 7.02s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8242, 'learning_rate': 9.17517814726841e-05, 'epoch': 2.68} + 13%|█████████▊ | 2392/17840 [4:03:02<30:06:19, 7.02s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9727, 'learning_rate': 9.17458432304038e-05, 'epoch': 2.68} +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:03:17<30:26:03, 7.09s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:03:17<30:26:03, 7.09s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5685, 'learning_rate': 9.173990498812351e-05, 'epoch': 2.68} + 13%|█████████▊ | 2394/17840 [4:03:17<30:26:03, 7.09s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:03:17<30:26:03, 7.09s/it]g-point operations will not be computed-17 20:42:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2395/17840 [4:03:24<30:21:17, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2395/17840 [4:03:24<30:21:17, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7642, 'learning_rate': 9.173396674584323e-05, 'epoch': 2.68} + 13%|█████████▊ | 2395/17840 [4:03:24<30:21:17, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [4:03:31<30:13:48, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [4:03:31<30:13:48, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9469, 'learning_rate': 9.172802850356294e-05, 'epoch': 2.69} +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:33,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:33,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [4:03:38<30:07:53, 7.02s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [4:03:38<30:07:53, 7.02s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [4:03:38<30:07:53, 7.02s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [4:03:38<30:07:53, 7.02s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [4:03:38<30:07:53, 7.02s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2398/17840 [4:03:45<30:08:16, 7.03s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2398/17840 [4:03:45<30:08:16, 7.03s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:47,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:47,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2399/17840 [4:03:52<30:00:17, 7.00s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2399/17840 [4:03:52<30:00:17, 7.00s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2399/17840 [4:03:52<30:00:17, 7.00s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2399/17840 [4:03:52<30:00:17, 7.00s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2399/17840 [4:03:52<30:00:17, 7.00s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [4:04:01<32:56:45, 7.68s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:01,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:01,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:01,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [4:04:08<32:05:51, 7.48s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [4:04:08<32:05:51, 7.48s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [4:04:08<32:05:51, 7.48s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [4:04:08<32:05:51, 7.48s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [4:04:08<32:05:51, 7.48s/it]g-point operations will not be computed-17 20:44:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [4:04:15<31:21:34, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [4:04:15<31:21:34, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [4:04:15<31:21:34, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [4:04:15<31:21:34, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:04:22<30:46:41, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:04:22<30:46:41, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:04:22<30:46:41, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:25,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:25,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.65, 'learning_rate': 9.168052256532068e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:25,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:25,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:25,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2405/17840 [4:04:35<29:51:49, 6.97s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2406/17840 [4:04:42<29:25:42, 6.86s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:42,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:42,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:42,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2407/17840 [4:04:48<29:07:32, 6.79s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2407/17840 [4:04:48<29:07:32, 6.79s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:50,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [4:04:55<28:57:06, 6.75s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [4:04:55<28:57:06, 6.75s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8516, 'learning_rate': 9.165676959619953e-05, 'epoch': 2.7} + 13%|█████████▊ | 2408/17840 [4:04:55<28:57:06, 6.75s/it]g-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7264, 'learning_rate': 9.165083135391924e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:59,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:13,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2410/17840 [4:05:08<28:24:43, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:07,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2410/17840 [4:05:08<28:24:43, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:07,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2410/17840 [4:05:08<28:24:43, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:07,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2410/17840 [4:05:08<28:24:43, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:07,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2411/17840 [4:05:15<28:09:42, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2411/17840 [4:05:15<28:09:42, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2411/17840 [4:05:15<28:09:42, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2411/17840 [4:05:15<28:09:42, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2412/17840 [4:05:21<27:57:23, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:21,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:21,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:21,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2413/17840 [4:05:27<27:45:21, 6.48s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:28,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:28,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2414/17840 [4:05:34<27:36:06, 6.44s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2414/17840 [4:05:34<27:36:06, 6.44s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9009, 'learning_rate': 9.162114014251781e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:35,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2415/17840 [4:05:40<27:26:35, 6.40s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2415/17840 [4:05:40<27:26:35, 6.40s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0366, 'learning_rate': 9.161520190023753e-05, 'epoch': 2.71} + 14%|█████████▉ | 2415/17840 [4:05:40<27:26:35, 6.40s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:43,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:43,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7721, 'learning_rate': 9.160926365795724e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:48,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2417/17840 [4:05:53<27:06:46, 6.33s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2417/17840 [4:05:53<27:06:46, 6.33s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7929, 'learning_rate': 9.160332541567696e-05, 'epoch': 2.71} + 14%|█████████▉ | 2417/17840 [4:05:53<27:06:46, 6.33s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:56,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:56,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9579, 'learning_rate': 9.159738717339668e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:00,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2419/17840 [4:06:04<26:15:54, 6.13s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2419/17840 [4:06:04<26:15:54, 6.13s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:04,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:04,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2420/17840 [4:06:10<25:50:19, 6.03s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2420/17840 [4:06:10<25:50:19, 6.03s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:10,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:10,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2421/17840 [4:06:16<25:23:23, 5.93s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2421/17840 [4:06:16<25:23:23, 5.93s/it]g-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:16,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:16,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:16,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2422/17840 [4:06:21<24:53:15, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:20,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2422/17840 [4:06:21<24:53:15, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:20,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:24,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:20,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:24,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:20,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:26,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:20,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:26,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:20,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2424/17840 [4:06:32<23:49:18, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2424/17840 [4:06:32<23:49:18, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6564, 'learning_rate': 9.156175771971497e-05, 'epoch': 2.72} + 14%|█████████▉ | 2424/17840 [4:06:32<23:49:18, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2425/17840 [4:06:39<25:54:08, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2425/17840 [4:06:39<25:54:08, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.765, 'learning_rate': 9.155581947743468e-05, 'epoch': 2.72} +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:40,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:40,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:30,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2426/17840 [4:06:44<24:19:12, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:42,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:44,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:42,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:44,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:42,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2427/17840 [4:06:49<22:36:19, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:47,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:49,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:47,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:49,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:47,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2428/17840 [4:06:53<21:02:17, 4.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:51,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:52,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:51,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:52,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:51,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2429/17840 [4:06:56<19:30:13, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:54,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2429/17840 [4:06:56<19:30:13, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:54,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2430/17840 [4:07:00<18:07:10, 4.23s/it]g-point operations will not be computed-17 20:47:54,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:58,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:59,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:58,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2431/17840 [4:07:03<16:41:51, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:48:01,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2431/17840 [4:07:03<16:41:51, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:48:01,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2432/17840 [4:07:06<15:18:05, 3.58s/it]g-point operations will not be computed-17 20:48:01,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████��█▉ | 2432/17840 [4:07:06<15:18:05, 3.58s/it]g-point operations will not be computed-17 20:48:01,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2433/17840 [4:07:08<13:47:36, 3.22s/it]g-point operations will not be computed-17 20:48:03,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2433/17840 [4:07:08<13:47:36, 3.22s/it]g-point operations will not be computed-17 20:48:03,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 20:48:06,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2434/17840 [4:07:10<12:22:06, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:48:09,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2434/17840 [4:07:10<12:22:06, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:48:09,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:13,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:09,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:13,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:09,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2435/17840 [4:07:18<18:43:27, 4.38s/it]g-point operations will not be computed-17 20:48:09,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2435/17840 [4:07:18<18:43:27, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2435/17840 [4:07:18<18:43:27, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:21,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:21,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:07:26<22:54:20, 5.35s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:07:26<22:54:20, 5.35s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:07:26<22:54:20, 5.35s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:07:26<22:54:20, 5.35s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:07:26<22:54:20, 5.35s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [4:07:33<25:37:45, 5.99s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [4:07:33<25:37:45, 5.99s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:36,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:36,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:41<27:26:30, 6.41s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:41<27:26:30, 6.41s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:41<27:26:30, 6.41s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:41<27:26:30, 6.41s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:41<27:26:30, 6.41s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [4:07:48<28:36:39, 6.69s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [4:07:48<28:36:39, 6.69s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [4:07:48<28:36:39, 6.69s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:52,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:52,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0193, 'learning_rate': 9.14667458432304e-05, 'epoch': 2.74} +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:52,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:52,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:52,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:08:02<29:48:12, 6.97s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:08:02<29:48:12, 6.97s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:08:02<29:48:12, 6.97s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:08:02<29:48:12, 6.97s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:08:02<29:48:12, 6.97s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2442/17840 [4:08:10<30:09:22, 7.05s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:10,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:10,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:10,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:08:17<30:22:51, 7.10s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:08:17<30:22:51, 7.10s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:08:17<30:22:51, 7.10s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:08:17<30:22:51, 7.10s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:08:17<30:22:51, 7.10s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2444/17840 [4:08:24<30:31:37, 7.14s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2444/17840 [4:08:24<30:31:37, 7.14s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:26,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:08:31<30:26:25, 7.12s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:08:31<30:26:25, 7.12s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8633, 'learning_rate': 9.143705463182898e-05, 'epoch': 2.74} + 14%|██████████ | 2445/17840 [4:08:31<30:26:25, 7.12s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:08:31<30:26:25, 7.12s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:08:31<30:26:25, 7.12s/it]g-point operations will not be computed-17 20:48:17,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2446/17840 [4:08:38<30:14:20, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2446/17840 [4:08:38<30:14:20, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2446/17840 [4:08:38<30:14:20, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2447/17840 [4:08:45<30:09:23, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2447/17840 [4:08:45<30:09:23, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8524, 'learning_rate': 9.142517814726841e-05, 'epoch': 2.74} + 14%|██████████ | 2447/17840 [4:08:45<30:09:23, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2447/17840 [4:08:45<30:09:23, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2447/17840 [4:08:45<30:09:23, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:37,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [4:08:52<30:01:43, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [4:08:52<30:01:43, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [4:08:52<30:01:43, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [4:08:52<30:01:43, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2449/17840 [4:08:59<29:50:08, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2449/17840 [4:08:59<29:50:08, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2449/17840 [4:08:59<29:50:08, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2449/17840 [4:08:59<29:50:08, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:09:08<32:41:14, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:09:08<32:41:14, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8569, 'learning_rate': 9.140736342042756e-05, 'epoch': 2.75} + 14%|██████████ | 2450/17840 [4:09:08<32:41:14, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:09:08<32:41:14, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:09:08<32:41:14, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:51,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:09:15<31:42:46, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:09:15<31:42:46, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:09:15<31:42:46, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2452/17840 [4:09:22<30:55:51, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2452/17840 [4:09:22<30:55:51, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0457, 'learning_rate': 9.1395486935867e-05, 'epoch': 2.75} + 14%|██████████ | 2452/17840 [4:09:22<30:55:51, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:26,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:26,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7883, 'learning_rate': 9.13895486935867e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:26,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:26,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:26,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:14,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:09:35<29:53:54, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:09:35<29:53:54, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:09:35<29:53:54, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2455/17840 [4:09:42<29:30:34, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2455/17840 [4:09:42<29:30:34, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7368, 'learning_rate': 9.137767220902613e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:44,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2456/17840 [4:09:49<29:10:16, 6.83s/it]g-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2456/17840 [4:09:49<29:10:16, 6.83s/it]g-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.712, 'learning_rate': 9.137173396674584e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:51,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2457/17840 [4:09:55<28:50:55, 6.75s/it]g-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2457/17840 [4:09:55<28:50:55, 6.75s/it]g-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9617, 'learning_rate': 9.136579572446557e-05, 'epoch': 2.75} + 14%|██████████ | 2457/17840 [4:09:55<28:50:55, 6.75s/it]g-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:59,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:59,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7964, 'learning_rate': 9.135985748218528e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:59,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:59,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:34,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2459/17840 [4:10:08<28:15:23, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2459/17840 [4:10:08<28:15:23, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5358, 'learning_rate': 9.1353919239905e-05, 'epoch': 2.76} + 14%|██████████ | 2459/17840 [4:10:08<28:15:23, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2460/17840 [4:10:15<28:03:38, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2460/17840 [4:10:15<28:03:38, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7774, 'learning_rate': 9.13479809976247e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:17,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2461/17840 [4:10:21<27:54:57, 6.53s/it]g-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2461/17840 [4:10:21<27:54:57, 6.53s/it]g-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1415, 'learning_rate': 9.134204275534442e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:23,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [4:10:28<27:38:19, 6.47s/it]g-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [4:10:28<27:38:19, 6.47s/it]g-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7756, 'learning_rate': 9.133610451306413e-05, 'epoch': 2.76} + 14%|██████████ | 2462/17840 [4:10:28<27:38:19, 6.47s/it]g-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:31,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:31,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6768, 'learning_rate': 9.133016627078385e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:31,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:37,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:37,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0385, 'learning_rate': 9.132422802850357e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:37,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:43,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:43,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8485, 'learning_rate': 9.131828978622329e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:43,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:43,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:43,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:07,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:53<27:00:22, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:51,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:53<27:00:22, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:51,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:53<27:00:22, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:51,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:53<27:00:22, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:51,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2467/17840 [4:10:59<26:44:54, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2467/17840 [4:10:59<26:44:54, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:02,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:02,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7999, 'learning_rate': 9.130047505938243e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:02,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:02,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:08,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:08,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:08,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:08,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:13,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:13,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:17,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:17,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2471/17840 [4:11:22<25:04:22, 5.87s/it]g-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:22,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:22,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:22,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:57,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:11:28<24:39:41, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:11:28<24:39:41, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:11:28<24:39:41, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:30,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:30,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:34,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:34,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2474/17840 [4:11:38<23:25:32, 5.49s/it]g-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:37,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:37,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:37,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2475/17840 [4:11:45<25:22:46, 5.95s/it]g-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2475/17840 [4:11:45<25:22:46, 5.95s/it]g-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:46,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:46,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:26,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2476/17840 [4:11:50<23:55:06, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:48,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:50,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:48,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:50,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:48,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2477/17840 [4:11:54<22:30:36, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:52,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:54,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:52,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:54,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:52,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2478/17840 [4:11:58<21:01:47, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:56,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:56,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:56,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2479/17840 [4:12:02<19:28:36, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:00,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:02,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:00,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:02,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:00,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:12:05<17:54:46, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:03,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:12:05<17:54:46, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:03,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2481/17840 [4:12:08<16:20:08, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:06,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2481/17840 [4:12:08<16:20:08, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:06,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2482/17840 [4:12:11<14:50:08, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:09,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:10,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:09,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:10,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:09,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:12:16<12:06:15, 2.84s/it]g-point operations will not be computed-17 20:53:11,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:12:16<12:06:15, 2.84s/it]g-point operations will not be computed-17 20:53:11,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:12:16<12:06:15, 2.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:12:16<12:06:15, 2.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:18,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:18,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:12:23<18:24:23, 4.32s/it]g-point operations will not be computed-17 20:53:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:12:23<18:24:23, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:12:23<18:24:23, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:26,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:26,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:12:31<22:37:40, 5.31s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:12:31<22:37:40, 5.31s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:12:31<22:37:40, 5.31s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:12:31<22:37:40, 5.31s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:12:31<22:37:40, 5.31s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:12:38<25:24:33, 5.96s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:39,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:39,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:12:46<27:17:38, 6.40s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:12:46<27:17:38, 6.40s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0655, 'learning_rate': 9.118171021377673e-05, 'epoch': 2.79} + 14%|██████████▏ | 2488/17840 [4:12:46<27:17:38, 6.40s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:12:46<27:17:38, 6.40s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:12:46<27:17:38, 6.40s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:53<28:40:06, 6.72s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:53<28:40:06, 6.72s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:53<28:40:06, 6.72s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:53<28:40:06, 6.72s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:53<28:40:06, 6.72s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:13:01<29:28:10, 6.91s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:01,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:01,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:13:08<29:57:48, 7.03s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:13:08<29:57:48, 7.03s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6672, 'learning_rate': 9.116389548693587e-05, 'epoch': 2.79} + 14%|██████████▏ | 2491/17840 [4:13:08<29:57:48, 7.03s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:13:08<29:57:48, 7.03s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:13:08<29:57:48, 7.03s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:13:15<30:11:23, 7.08s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:13:15<30:11:23, 7.08s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:13:15<30:11:23, 7.08s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:19,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:19,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7512, 'learning_rate': 9.11520190023753e-05, 'epoch': 2.79} +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:19,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:19,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:19,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:13:30<30:23:56, 7.13s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:13:30<30:23:56, 7.13s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:32,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:37<30:25:39, 7.14s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:37<30:25:39, 7.14s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.643, 'learning_rate': 9.114014251781473e-05, 'epoch': 2.8} + 14%|██████████▏ | 2495/17840 [4:13:37<30:25:39, 7.14s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:37<30:25:39, 7.14s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:37<30:25:39, 7.14s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2496/17840 [4:13:44<30:15:57, 7.10s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:44,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:44,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:13:51<30:08:05, 7.07s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:13:51<30:08:05, 7.07s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9635, 'learning_rate': 9.112826603325417e-05, 'epoch': 2.8} + 14%|██████████▏ | 2497/17840 [4:13:51<30:08:05, 7.07s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:13:51<30:08:05, 7.07s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:13:51<30:08:05, 7.07s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2498/17840 [4:13:58<30:03:56, 7.05s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:58,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:58,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:14:05<29:55:16, 7.02s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:14:05<29:55:16, 7.02s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7419, 'learning_rate': 9.11163895486936e-05, 'epoch': 2.8} + 14%|██████████▏ | 2499/17840 [4:14:05<29:55:16, 7.02s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:14:05<29:55:16, 7.02s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:14:05<29:55:16, 7.02s/it]g-point operations will not be computed-17 20:53:22,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2366] 2022-03-17 20:55:11,695 >> Num examples = 2642 | 2500/17840 [4:14:14<32:58:03, 7.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-17 20:55:11,695 >> Num examples = 2642 | 2500/17840 [4:14:14<32:58:03, 7.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-17 20:55:11,695 >> Num examples = 2642 | 2500/17840 [4:14:14<32:58:03, 7.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|▊ | 3/331 [00:04<08:50, 1.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|█ | 4/331 [00:06<10:00, 1.84s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|█ | 4/331 [00:06<10:00, 1.84s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|█ | 4/331 [00:06<10:00, 1.84s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▌ | 6/331 [00:12<12:20, 2.28s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▊ | 7/331 [00:14<12:28, 2.31s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|██ | 8/331 [00:16<12:44, 2.37s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▎ | 9/331 [00:19<13:22, 2.49s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▍ | 10/331 [00:22<14:18, 2.67s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▋ | 11/331 [00:25<13:48, 2.59s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|██▉ | 12/331 [00:27<13:34, 2.55s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▏ | 13/331 [00:30<13:21, 2.52s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▍ | 14/331 [00:32<13:14, 2.51s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▋ | 15/331 [00:35<14:24, 2.73s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▉ | 16/331 [00:39<15:20, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▏ | 17/331 [00:42<15:34, 2.97s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▍ | 18/331 [00:44<14:19, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▋ | 19/331 [00:47<14:02, 2.70s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▉ | 20/331 [00:49<13:11, 2.55s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [00:52<13:42, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [00:52<13:42, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [00:52<13:42, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▋ | 23/331 [00:59<16:09, 3.15s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▉ | 24/331 [01:03<17:09, 3.35s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▏ | 25/331 [01:06<16:30, 3.24s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▍ | 26/331 [01:08<15:19, 3.01s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▋ | 27/331 [01:11<15:26, 3.05s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▉ | 28/331 [01:14<14:54, 2.95s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▏ | 29/331 [01:17<14:25, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▍ | 30/331 [01:19<13:45, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▋ | 31/331 [01:21<13:04, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|███████▉ | 32/331 [01:24<12:45, 2.56s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▏ | 33/331 [01:27<12:49, 2.58s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▍ | 34/331 [01:29<12:48, 2.59s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▋ | 35/331 [01:32<12:56, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▉ | 36/331 [01:35<13:38, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▏ | 37/331 [01:38<14:17, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▍ | 38/331 [01:41<14:28, 2.96s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▋ | 39/331 [01:44<14:32, 2.99s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▉ | 40/331 [01:47<13:21, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|██████████▏ | 41/331 [01:49<12:44, 2.64s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▍ | 42/331 [01:52<13:35, 2.82s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▋ | 43/331 [01:56<14:23, 3.00s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▉ | 44/331 [01:59<14:50, 3.10s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▏ | 45/331 [02:01<14:00, 2.94s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▍ | 46/331 [02:04<12:59, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▋ | 47/331 [02:06<12:09, 2.57s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [02:09<12:20, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [02:09<12:20, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [02:09<12:20, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▍ | 50/331 [02:14<12:46, 2.73s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▋ | 51/331 [02:17<13:05, 2.81s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|████████████▉ | 52/331 [02:20<12:27, 2.68s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▏ | 53/331 [02:22<12:27, 2.69s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▍ | 54/331 [02:25<11:54, 2.58s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▋ | 55/331 [02:28<13:00, 2.83s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▊ | 56/331 [02:31<12:50, 2.80s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|██████████████ | 57/331 [02:33<12:23, 2.71s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▎ | 58/331 [02:37<12:52, 2.83s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▌ | 59/331 [02:39<12:09, 2.68s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▊ | 60/331 [02:41<11:49, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|███████████████ | 61/331 [02:44<12:18, 2.73s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▎ | 62/331 [02:47<12:08, 2.71s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▌ | 63/331 [02:50<13:09, 2.94s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▊ | 64/331 [02:53<12:46, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████ | 65/331 [02:56<12:30, 2.82s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▎ | 66/331 [03:00<13:40, 3.10s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▌ | 67/331 [03:03<14:16, 3.25s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|████████████████▊ | 68/331 [03:07<14:21, 3.28s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████ | 69/331 [03:10<14:04, 3.22s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▎ | 70/331 [03:13<13:50, 3.18s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▌ | 71/331 [03:16<13:58, 3.23s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|█████████████████▊ | 72/331 [03:19<13:52, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████ | 73/331 [03:22<13:19, 3.10s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████▎ | 74/331 [03:25<12:59, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▌ | 75/331 [03:28<13:13, 3.10s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▊ | 76/331 [03:31<12:31, 2.95s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|███████████████████ | 77/331 [03:34<12:13, 2.89s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▎ | 78/331 [03:36<11:43, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [03:39<11:17, 2.69s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▊ | 80/331 [03:41<11:07, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|████████████████████ | 81/331 [03:44<11:35, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▎ | 82/331 [03:47<11:16, 2.72s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▌ | 83/331 [03:50<11:37, 2.81s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [03:53<12:28, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████ | 85/331 [03:56<11:34, 2.82s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▎ | 86/331 [03:59<12:11, 2.99s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▌ | 87/331 [04:02<11:54, 2.93s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|█████████████████████▊ | 88/331 [04:05<11:31, 2.85s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████ | 89/331 [04:07<10:39, 2.64s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▎ | 90/331 [04:09<10:08, 2.52s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▌ | 91/331 [04:12<10:36, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|██████████████████████▊ | 92/331 [04:14<09:53, 2.48s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████ | 93/331 [04:17<09:59, 2.52s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████▎ | 94/331 [04:19<10:15, 2.60s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▌ | 95/331 [04:22<10:20, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▊ | 96/331 [04:25<10:26, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|████████████████████████ | 97/331 [04:27<10:01, 2.57s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▎ | 98/331 [04:30<10:25, 2.69s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▌ | 99/331 [04:33<10:26, 2.70s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▍ | 100/331 [04:35<09:59, 2.59s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▋ | 101/331 [04:38<09:52, 2.58s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▉ | 102/331 [04:41<10:37, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▏ | 103/331 [04:43<10:04, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▍ | 104/331 [04:46<10:03, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▋ | 105/331 [04:49<10:05, 2.68s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▉ | 106/331 [04:51<10:07, 2.70s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|██████████████████████████▏ | 107/331 [04:54<09:32, 2.55s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▍ | 108/331 [04:56<09:21, 2.52s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▋ | 109/331 [04:59<09:17, 2.51s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▉ | 110/331 [05:02<09:40, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▏ | 111/331 [05:04<09:42, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▍ | 112/331 [05:07<09:41, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▋ | 113/331 [05:09<09:12, 2.53s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▉ | 114/331 [05:12<09:14, 2.56s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▏ | 115/331 [05:14<09:19, 2.59s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▍ | 116/331 [05:17<09:39, 2.70s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▋ | 117/331 [05:20<09:33, 2.68s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|████████████████████████████▉ | 118/331 [05:22<09:16, 2.61s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████ | 119/331 [05:25<09:14, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████▎ | 120/331 [05:28<09:15, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▌ | 121/331 [05:31<09:39, 2.76s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▊ | 122/331 [05:33<09:30, 2.73s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████ | 123/331 [05:37<10:08, 2.93s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████▎ | 124/331 [05:40<09:56, 2.88s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▌ | 125/331 [05:43<10:34, 3.08s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▊ | 126/331 [05:46<10:36, 3.11s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|███████████████████████████████ | 127/331 [05:50<10:59, 3.23s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▎ | 128/331 [05:53<10:54, 3.22s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▌ | 129/331 [05:56<10:39, 3.17s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▊ | 130/331 [05:59<10:48, 3.23s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████ | 131/331 [06:03<10:56, 3.28s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▎ | 132/331 [06:06<10:17, 3.10s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▌ | 133/331 [06:08<09:35, 2.91s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▊ | 134/331 [06:11<09:13, 2.81s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████ | 135/331 [06:14<09:18, 2.85s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▎ | 136/331 [06:17<09:37, 2.96s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▌ | 137/331 [06:20<10:01, 3.10s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|█████████████████████████████████▊ | 138/331 [06:24<10:17, 3.20s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [06:26<09:08, 2.85s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████▎ | 140/331 [06:29<09:49, 3.08s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▌ | 141/331 [06:32<09:24, 2.97s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▋ | 142/331 [06:35<09:05, 2.89s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▉ | 143/331 [06:38<09:29, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▏ | 144/331 [06:41<09:06, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▍ | 145/331 [06:44<08:58, 2.89s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▋ | 146/331 [06:47<09:23, 3.04s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▉ | 147/331 [06:50<09:03, 2.95s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▏ | 148/331 [06:52<08:31, 2.79s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▍ | 149/331 [06:54<08:03, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▋ | 150/331 [06:58<08:24, 2.79s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|████████████████████████████████████▉ | 151/331 [07:00<08:17, 2.76s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▏ | 152/331 [07:03<07:56, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▍ | 153/331 [07:05<07:45, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▋ | 154/331 [07:08<08:04, 2.73s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▉ | 155/331 [07:11<08:29, 2.89s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▏ | 156/331 [07:15<08:41, 2.98s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▍ | 157/331 [07:18<08:57, 3.09s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▋ | 158/331 [07:21<09:03, 3.14s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [07:24<09:05, 3.17s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|███████████████████████████████████████▏ | 160/331 [07:27<08:32, 3.00s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▍ | 161/331 [07:30<08:15, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▋ | 162/331 [07:33<08:41, 3.08s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [07:37<08:45, 3.13s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▏ | 164/331 [07:39<08:19, 2.99s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▍ | 165/331 [07:42<08:07, 2.94s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▌ | 166/331 [07:45<07:51, 2.86s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▊ | 167/331 [07:48<08:03, 2.95s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████ | 168/331 [07:50<07:40, 2.82s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▎ | 169/331 [07:53<07:48, 2.89s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▌ | 170/331 [07:56<07:22, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|█████████████████████████████████████████▊ | 171/331 [07:59<07:18, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████ | 172/331 [08:01<07:01, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████▎ | 173/331 [08:04<07:12, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▌ | 174/331 [08:06<06:53, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▊ | 175/331 [08:09<06:57, 2.67s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████ | 176/331 [08:12<06:44, 2.61s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████▎ | 177/331 [08:15<07:06, 2.77s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▌ | 178/331 [08:18<07:33, 2.96s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▊ | 179/331 [08:22<07:53, 3.12s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|████████████████████████████████████████████ | 180/331 [08:25<07:43, 3.07s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▎ | 181/331 [08:28<07:36, 3.04s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▌ | 182/331 [08:30<06:57, 2.80s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▊ | 183/331 [08:32<06:25, 2.60s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████ | 184/331 [08:34<06:02, 2.46s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▎ | 185/331 [08:36<05:40, 2.33s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▌ | 186/331 [08:39<05:49, 2.41s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▊ | 187/331 [08:42<06:21, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████ | 188/331 [08:45<06:19, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██��███████████████████████████████████████████▎ | 189/331 [08:47<06:02, 2.55s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▍ | 190/331 [08:49<05:46, 2.45s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▋ | 191/331 [08:51<05:40, 2.43s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▉ | 192/331 [08:54<05:28, 2.37s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|███████████████████████████████████████████████▏ | 193/331 [08:57<05:53, 2.56s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▍ | 194/331 [08:59<05:35, 2.45s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▋ | 195/331 [09:01<05:31, 2.43s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▉ | 196/331 [09:04<05:39, 2.51s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▏ | 197/331 [09:07<05:56, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▍ | 198/331 [09:09<05:37, 2.53s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▋ | 199/331 [09:12<05:38, 2.57s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▉ | 200/331 [09:14<05:21, 2.45s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▏ | 201/331 [09:16<05:17, 2.44s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▍ | 202/331 [09:19<05:25, 2.53s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▋ | 203/331 [09:22<05:26, 2.55s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|█████████████████████████████████████████████████▉ | 204/331 [09:25<05:46, 2.72s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▏ | 205/331 [09:28<05:48, 2.76s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▍ | 206/331 [09:30<05:40, 2.72s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▋ | 207/331 [09:34<05:56, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▉ | 208/331 [09:37<05:58, 2.91s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▏ | 209/331 [09:39<05:25, 2.67s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▍ | 210/331 [09:41<05:02, 2.50s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▋ | 211/331 [09:44<05:08, 2.57s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▉ | 212/331 [09:46<04:56, 2.49s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|████████████████████████████████████████████████████ | 213/331 [09:48<04:56, 2.51s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▎ | 214/331 [09:51<04:40, 2.40s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▌ | 215/331 [09:53<04:28, 2.31s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▊ | 216/331 [09:56<04:56, 2.58s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████ | 217/331 [09:59<04:56, 2.60s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▎ | 218/331 [10:02<05:09, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▌ | 219/331 [10:04<05:03, 2.71s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▊ | 220/331 [10:07<04:52, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████ | 221/331 [10:09<04:54, 2.68s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▎ | 222/331 [10:12<04:42, 2.59s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▌ | 223/331 [10:15<04:44, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|██████████████████████████████████████████████████████▊ | 224/331 [10:17<04:43, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████ | 225/331 [10:20<04:40, 2.64s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████▎ | 226/331 [10:23<04:52, 2.79s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▌ | 227/331 [10:26<04:45, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▊ | 228/331 [10:28<04:36, 2.69s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████ | 229/331 [10:31<04:31, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████▎ | 230/331 [10:33<04:22, 2.60s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▌ | 231/331 [10:36<04:29, 2.70s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▊ | 232/331 [10:39<04:22, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|█████████████████████████████████████████████████████████ | 233/331 [10:42<04:29, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [10:44<04:14, 2.62s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [10:46<04:04, 2.55s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|████████████████████████████████████████████████████���████▊ | 236/331 [10:50<04:30, 2.85s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|█████████████████████████████████████████████████████████▉ | 237/331 [10:53<04:42, 3.00s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [10:56<04:39, 3.01s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [10:59<04:40, 3.05s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [11:03<04:44, 3.12s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [11:06<04:48, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [11:09<04:47, 3.23s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [11:13<04:43, 3.22s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [11:16<04:46, 3.29s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [11:19<04:35, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [11:23<04:45, 3.36s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [11:26<04:35, 3.28s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [11:29<04:14, 3.06s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▉ | 249/331 [11:31<03:54, 2.86s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [11:33<03:41, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [11:36<03:43, 2.79s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [11:39<03:29, 2.66s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [11:42<03:39, 2.81s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [11:44<03:31, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [11:48<03:37, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [11:50<03:29, 2.80s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [11:53<03:34, 2.90s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [11:56<03:20, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [11:58<03:13, 2.69s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▋ | 260/331 [12:01<03:15, 2.75s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [12:03<03:02, 2.61s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████ | 262/331 [12:06<03:02, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [12:09<03:10, 2.80s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▌ | 264/331 [12:12<03:01, 2.71s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [12:14<02:54, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [12:14<02:54, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [12:14<02:54, 2.65s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▎ | 267/331 [12:20<02:55, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [12:23<02:52, 2.74s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [12:26<03:01, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [12:29<02:57, 2.90s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [12:32<02:58, 2.98s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [12:35<02:49, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [12:38<02:48, 2.91s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [12:38<02:48, 2.91s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [12:38<02:48, 2.91s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [12:44<02:52, 3.09s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [12:47<02:39, 2.91s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|███████████████████████████████████████████████████████████████████▊ | 277/331 [12:49<02:32, 2.82s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [12:52<02:27, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [12:56<02:37, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [12:58<02:31, 2.98s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [13:02<02:33, 3.07s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [13:05<02:30, 3.06s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [13:08<02:31, 3.16s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [13:12<02:33, 3.27s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [13:15<02:31, 3.30s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [13:18<02:29, 3.33s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▏ | 287/331 [13:22<02:30, 3.42s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [13:25<02:25, 3.39s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [13:28<02:13, 3.19s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|██████████████████████████████████████████████████████████████████████▉ | 290/331 [13:31<02:03, 3.02s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [13:33<01:54, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▍ | 292/331 [13:36<01:48, 2.79s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [13:39<01:45, 2.77s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [13:41<01:37, 2.63s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▏ | 295/331 [13:43<01:32, 2.56s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [13:46<01:27, 2.49s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|███████████████████████████████████████████████████████████████████████���▋ | 297/331 [13:49<01:34, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▉ | 298/331 [13:53<01:39, 3.01s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [13:55<01:32, 2.90s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▍ | 300/331 [13:58<01:30, 2.90s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [14:01<01:25, 2.86s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▉ | 302/331 [14:03<01:20, 2.77s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [14:06<01:14, 2.67s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [14:09<01:14, 2.76s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [14:12<01:14, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████���███████████████████████████████████████████████████▉ | 306/331 [14:15<01:16, 3.05s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [14:19<01:16, 3.19s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [14:23<01:17, 3.36s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [14:26<01:14, 3.40s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [14:29<01:06, 3.18s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████ | 311/331 [14:32<01:03, 3.17s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [14:35<00:56, 2.97s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [14:37<00:52, 2.90s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▊ | 314/331 [14:40<00:50, 2.95s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [14:44<00:48, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [14:47<00:45, 3.06s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▌ | 317/331 [14:50<00:44, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▊ | 318/331 [14:53<00:39, 3.04s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [14:55<00:34, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [14:58<00:31, 2.90s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [15:01<00:28, 2.87s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [15:05<00:27, 3.02s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████ | 323/331 [15:07<00:23, 2.93s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [15:10<00:21, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▌ | 325/331 [15:14<00:18, 3.04s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▊ | 326/331 [15:17<00:15, 3.11s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [15:20<00:12, 3.09s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▎| 328/331 [15:23<00:09, 3.11s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [15:26<00:06, 3.04s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [15:30<00:03, 3.22s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|█████████████████████████████████████████████████████████████████████████████████| 331/331 [15:31<00:00, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|█████████████████████████████████████████████████████████████████████████████████| 331/331 [15:31<00:00, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/17/2022 21:10:47 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|configuration_utils.py:438] 2022-03-17 21:10:47,103 >> Configuration saved in ./checkpoint-2500/config.json [INFO|trainer.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-17 21:10:52,184 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-17 21:10:52,184 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-17 21:10:52,184 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-17 20:55:11,692 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/17/2022 21:11:12 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220317_164055-2lyj41rg/run-2lyj41rg.wandb']. This may take a bit of time if the files are large.