diff --git a/eng-nah-svo-translation/README.md b/eng-nah-svo-translation/README.md
index ce0eb17a7e3f64e535bde10aecf80f6e420ae0d5..595cd1c823e82d0fb941138ae5d1c2db2bcf9fcf 100644
--- a/eng-nah-svo-translation/README.md
+++ b/eng-nah-svo-translation/README.md
@@ -16,8 +16,9 @@ should probably proofread and complete it, then remove this comment. -->
 
 This model was trained from scratch on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.3041
-- Bleu: 0.0
+- Loss: 0.2640
+- Bleu: 0.0231
+- Chrf: 26.4891
 
 ## Model description
 
diff --git a/eng-nah-svo-translation/checkpoint-228/optimizer.pt b/eng-nah-svo-translation/checkpoint-228/optimizer.pt
index 367852daa5323185ad585a47eaf94868eb9f51bc..731d033565bbb414bd9c0752c8e7822a64441f5e 100644
--- a/eng-nah-svo-translation/checkpoint-228/optimizer.pt
+++ b/eng-nah-svo-translation/checkpoint-228/optimizer.pt
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5190a17f19275c1af2d846140e4909e9d083e4c4f44fbfb42acad0530b174290
+oid sha256:b8c16511ba92e2355ca80c70207aa4e9e2f7fbdd9342fc1670e5380107108d33
 size 597088389
diff --git a/eng-nah-svo-translation/checkpoint-228/pytorch_model.bin b/eng-nah-svo-translation/checkpoint-228/pytorch_model.bin
index 6817a00807fe7434691386a71277c0602a3079f3..13aa597fce04805efbaf720d316390e64f4060b4 100644
--- a/eng-nah-svo-translation/checkpoint-228/pytorch_model.bin
+++ b/eng-nah-svo-translation/checkpoint-228/pytorch_model.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:140fc7491625eee2830a2bfde50a63b78cd6939bed1b4abeb189be50ab10980f
+oid sha256:37bcbd2252fb522e3c5ed42fb094b45769438bea8b0c374cc08a19277b5576cc
 size 298763205
diff --git a/eng-nah-svo-translation/checkpoint-228/trainer_state.json b/eng-nah-svo-translation/checkpoint-228/trainer_state.json
index 5b8815d4d0a1ead69943d491ff585e2e38488a38..85c3124b21752a2e98fb61253c068c3d94a6ab51 100644
--- a/eng-nah-svo-translation/checkpoint-228/trainer_state.json
+++ b/eng-nah-svo-translation/checkpoint-228/trainer_state.json
@@ -12,7 +12,7 @@
   "max_steps": 684,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 50445004308480.0,
+  "total_flos": 52376151785472.0,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/eng-nah-svo-translation/checkpoint-228/training_args.bin b/eng-nah-svo-translation/checkpoint-228/training_args.bin
index 9994891ab867aee0045265c08dc1422280fe4490..bc1c45f9050b16d948a8f770690c1c16f5b66a30 100644
--- a/eng-nah-svo-translation/checkpoint-228/training_args.bin
+++ b/eng-nah-svo-translation/checkpoint-228/training_args.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06a45c37f0e7284c095b4b503ffa422c6b8f2791990e008912c3c06d6db7d538
+oid sha256:e056894aace19b2ad0614ec4c70099b961a9aaa0c0c2b1edfbe8e70c015294d2
 size 4219
diff --git a/eng-nah-svo-translation/checkpoint-456/optimizer.pt b/eng-nah-svo-translation/checkpoint-456/optimizer.pt
index 0a13ad28b840b4765c6190add7bcfe58651153ef..7e7dd0eaf15d89ca16f3a94f75a5661a6827ce95 100644
--- a/eng-nah-svo-translation/checkpoint-456/optimizer.pt
+++ b/eng-nah-svo-translation/checkpoint-456/optimizer.pt
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7de8c09d2c5d4f0096b953c55e83345013e4bcfb30df1f8899d8a579b549de65
+oid sha256:4f2fb78ceb69469a9888669142a52a24a22dfc567e2e35859abb89dcefc5c87f
 size 597088389
diff --git a/eng-nah-svo-translation/checkpoint-456/pytorch_model.bin b/eng-nah-svo-translation/checkpoint-456/pytorch_model.bin
index 7f4475ff8a860ad9d05afc5340714285ace04577..3c35017098b5c3d3e1d43d8f4b4e2373bb0ea919 100644
--- a/eng-nah-svo-translation/checkpoint-456/pytorch_model.bin
+++ b/eng-nah-svo-translation/checkpoint-456/pytorch_model.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef15720547c6e860442101e376eaa81dc981ef8521399ce751cfaf29fc229213
+oid sha256:46c8cd75372092eb227b14656a6abb4aede43d054867626ed0b59437dba56b84
 size 298763205
diff --git a/eng-nah-svo-translation/checkpoint-456/trainer_state.json b/eng-nah-svo-translation/checkpoint-456/trainer_state.json
index 1d8cdbc8c30e3bac7473146876de9199049ac3b0..cfb44e6f5d588e13471b5de0d1289d0c5409197d 100644
--- a/eng-nah-svo-translation/checkpoint-456/trainer_state.json
+++ b/eng-nah-svo-translation/checkpoint-456/trainer_state.json
@@ -12,7 +12,7 @@
   "max_steps": 684,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 100891067940864.0,
+  "total_flos": 104753362894848.0,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/eng-nah-svo-translation/checkpoint-456/training_args.bin b/eng-nah-svo-translation/checkpoint-456/training_args.bin
index 9994891ab867aee0045265c08dc1422280fe4490..bc1c45f9050b16d948a8f770690c1c16f5b66a30 100644
--- a/eng-nah-svo-translation/checkpoint-456/training_args.bin
+++ b/eng-nah-svo-translation/checkpoint-456/training_args.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06a45c37f0e7284c095b4b503ffa422c6b8f2791990e008912c3c06d6db7d538
+oid sha256:e056894aace19b2ad0614ec4c70099b961a9aaa0c0c2b1edfbe8e70c015294d2
 size 4219
diff --git a/eng-nah-svo-translation/checkpoint-684/optimizer.pt b/eng-nah-svo-translation/checkpoint-684/optimizer.pt
index 1841d2af2b5d6fd70b37fcbe0ee34ce7dcd2760b..a97d5ecb97e4cd85f70ba786ddc66aea39423b88 100644
--- a/eng-nah-svo-translation/checkpoint-684/optimizer.pt
+++ b/eng-nah-svo-translation/checkpoint-684/optimizer.pt
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:19578c8bd50d0d5922742f052fdb7391eec55dd2ab281226cdcae8cd78356dd9
+oid sha256:330d85b27bca67820bebe7c7bd87bbfd73edfde6172890ffd2c8298d597a3c57
 size 597088389
diff --git a/eng-nah-svo-translation/checkpoint-684/pytorch_model.bin b/eng-nah-svo-translation/checkpoint-684/pytorch_model.bin
index 8cfef71fafeaa52d0e82916072a440084dce6704..afcd596c8b8632dcae71b3dc25fdd3e7a2ea3bb4 100644
--- a/eng-nah-svo-translation/checkpoint-684/pytorch_model.bin
+++ b/eng-nah-svo-translation/checkpoint-684/pytorch_model.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9f62408ea2e275aed7548ea31e37c534dd035154b3999483e0ed481c2dd1f9e2
+oid sha256:174c26a830bb38c835122d896e568f06abcf2e72976220ff513f32f769be682a
 size 298763205
diff --git a/eng-nah-svo-translation/checkpoint-684/trainer_state.json b/eng-nah-svo-translation/checkpoint-684/trainer_state.json
index e96724abfb0fd39ea715ff1d174d2912aed6c2dd..74a625dfe2e14489496fc7f4b120721df0419c53 100644
--- a/eng-nah-svo-translation/checkpoint-684/trainer_state.json
+++ b/eng-nah-svo-translation/checkpoint-684/trainer_state.json
@@ -11,7 +11,7 @@
     {
       "epoch": 2.19,
       "learning_rate": 5.380116959064328e-06,
-      "loss": 0.2276,
+      "loss": 0.1428,
       "step": 500
     }
   ],
@@ -19,7 +19,7 @@
   "max_steps": 684,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 151058529386496.0,
+  "total_flos": 156851971817472.0,
   "trial_name": null,
   "trial_params": null
 }
diff --git a/eng-nah-svo-translation/checkpoint-684/training_args.bin b/eng-nah-svo-translation/checkpoint-684/training_args.bin
index 9994891ab867aee0045265c08dc1422280fe4490..bc1c45f9050b16d948a8f770690c1c16f5b66a30 100644
--- a/eng-nah-svo-translation/checkpoint-684/training_args.bin
+++ b/eng-nah-svo-translation/checkpoint-684/training_args.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06a45c37f0e7284c095b4b503ffa422c6b8f2791990e008912c3c06d6db7d538
+oid sha256:e056894aace19b2ad0614ec4c70099b961a9aaa0c0c2b1edfbe8e70c015294d2
 size 4219
diff --git a/eng-nah-svo-translation/pytorch_model.bin b/eng-nah-svo-translation/pytorch_model.bin
index 8cfef71fafeaa52d0e82916072a440084dce6704..afcd596c8b8632dcae71b3dc25fdd3e7a2ea3bb4 100644
--- a/eng-nah-svo-translation/pytorch_model.bin
+++ b/eng-nah-svo-translation/pytorch_model.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9f62408ea2e275aed7548ea31e37c534dd035154b3999483e0ed481c2dd1f9e2
+oid sha256:174c26a830bb38c835122d896e568f06abcf2e72976220ff513f32f769be682a
 size 298763205
diff --git a/eng-nah-svo-translation/training_args.bin b/eng-nah-svo-translation/training_args.bin
index 9994891ab867aee0045265c08dc1422280fe4490..bc1c45f9050b16d948a8f770690c1c16f5b66a30 100644
--- a/eng-nah-svo-translation/training_args.bin
+++ b/eng-nah-svo-translation/training_args.bin
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06a45c37f0e7284c095b4b503ffa422c6b8f2791990e008912c3c06d6db7d538
+oid sha256:e056894aace19b2ad0614ec4c70099b961a9aaa0c0c2b1edfbe8e70c015294d2
 size 4219
diff --git a/myerrors_1551.out b/myerrors_1551.out
deleted file mode 100644
index ab65a5a7401763e92b51f249db9d4702764cdce0..0000000000000000000000000000000000000000
--- a/myerrors_1551.out
+++ /dev/null
@@ -1,34 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-Using pad_token, but it is not set yet.
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 130, in <module>
-    trainer.evaluate(max_length=max_length)
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 159, in evaluate
-    return super().evaluate(eval_dataset, ignore_keys=ignore_keys, metric_key_prefix=metric_key_prefix)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 2972, in evaluate
-    output = eval_loop(
-             ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 3151, in evaluation_loop
-    for step, inputs in enumerate(dataloader):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/accelerate/data_loader.py", line 384, in __iter__
-    current_batch = next(dataloader_iter)
-                    ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 633, in __next__
-    data = self._next_data()
-           ^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 677, in _next_data
-    data = self._dataset_fetcher.fetch(index)  # may raise StopIteration
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/_utils/fetch.py", line 54, in fetch
-    return self.collate_fn(data)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/data/data_collator.py", line 586, in __call__
-    features = self.tokenizer.pad(
-               ^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/tokenization_utils_base.py", line 3059, in pad
-    padding_strategy, _, max_length, _ = self._get_padding_truncation_strategies(
-                                         ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/tokenization_utils_base.py", line 2507, in _get_padding_truncation_strategies
-    raise ValueError(
-ValueError: Asking to pad but the tokenizer does not have a padding token. Please select a token to use as `pad_token` `(tokenizer.pad_token = tokenizer.eos_token e.g.)` or add a new pad token via `tokenizer.add_special_tokens({'pad_token': '[PAD]'})`.
diff --git a/myerrors_1552.out b/myerrors_1552.out
deleted file mode 100644
index f6f885aa01e57e2d5410aa3d681f4a024427cb0c..0000000000000000000000000000000000000000
--- a/myerrors_1552.out
+++ /dev/null
@@ -1,29 +0,0 @@
-Map:   0%|          | 0/7292 [00:00<?, ? examples/s]Map:  27%|██▋       | 2000/7292 [00:00<00:00, 9056.99 examples/s]Map:  82%|████████▏ | 6000/7292 [00:00<00:00, 17405.96 examples/s]Map: 100%|██████████| 7292/7292 [00:00<00:00, 17292.17 examples/s]
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 28511.75 examples/s]
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 30926.57 examples/s]
-Downloading (…)lve/main/config.json:   0%|          | 0.00/570 [00:00<?, ?B/s]Downloading (…)lve/main/config.json: 100%|██████████| 570/570 [00:00<00:00, 1.74MB/s]
-Downloading model.safetensors:   0%|          | 0.00/436M [00:00<?, ?B/s]Downloading model.safetensors:   2%|▏         | 10.5M/436M [00:00<00:05, 71.5MB/s]Downloading model.safetensors:   5%|▍         | 21.0M/436M [00:00<00:04, 86.4MB/s]Downloading model.safetensors:  10%|▉         | 41.9M/436M [00:00<00:03, 102MB/s] Downloading model.safetensors:  14%|█▍        | 62.9M/436M [00:00<00:03, 108MB/s]Downloading model.safetensors:  19%|█▉        | 83.9M/436M [00:00<00:03, 111MB/s]Downloading model.safetensors:  24%|██▍       | 105M/436M [00:00<00:02, 112MB/s] Downloading model.safetensors:  29%|██▉       | 126M/436M [00:01<00:02, 113MB/s]Downloading model.safetensors:  34%|███▎      | 147M/436M [00:01<00:02, 114MB/s]Downloading model.safetensors:  39%|███▊      | 168M/436M [00:01<00:02, 114MB/s]Downloading model.safetensors:  43%|████▎     | 189M/436M [00:01<00:02, 114MB/s]Downloading model.safetensors:  48%|████▊     | 210M/436M [00:01<00:02, 112MB/s]Downloading model.safetensors:  53%|█████▎    | 231M/436M [00:02<00:01, 114MB/s]Downloading model.safetensors:  58%|█████▊    | 252M/436M [00:02<00:01, 113MB/s]Downloading model.safetensors:  63%|██████▎   | 273M/436M [00:02<00:01, 114MB/s]Downloading model.safetensors:  67%|██████▋   | 294M/436M [00:02<00:01, 115MB/s]Downloading model.safetensors:  72%|███████▏  | 315M/436M [00:02<00:01, 114MB/s]Downloading model.safetensors:  77%|███████▋  | 336M/436M [00:03<00:00, 113MB/s]Downloading model.safetensors:  82%|████████▏ | 357M/436M [00:03<00:00, 115MB/s]Downloading model.safetensors:  87%|████████▋ | 377M/436M [00:03<00:00, 115MB/s]Downloading model.safetensors:  91%|█████████▏| 398M/436M [00:03<00:00, 114MB/s]Downloading model.safetensors:  96%|█████████▋| 419M/436M [00:03<00:00, 115MB/s]Downloading model.safetensors: 100%|██████████| 436M/436M [00:03<00:00, 115MB/s]Downloading model.safetensors: 100%|██████████| 436M/436M [00:03<00:00, 112MB/s]
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 131, in <module>
-    trainer.evaluate(max_length=max_length)
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 159, in evaluate
-    return super().evaluate(eval_dataset, ignore_keys=ignore_keys, metric_key_prefix=metric_key_prefix)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 2972, in evaluate
-    output = eval_loop(
-             ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 3161, in evaluation_loop
-    loss, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
-                           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 282, in prediction_step
-    generated_tokens = self.model.generate(**inputs, **gen_kwargs)
-                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 1402, in generate
-    self._validate_model_class()
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 1197, in _validate_model_class
-    raise TypeError(exception_message)
-TypeError: The current model class (BertModel) is not compatible with `.generate()`, as it doesn't have a language model head. Please use one of the following classes instead: {'BertLMHeadModel'}
diff --git a/myerrors_1553.out b/myerrors_1553.out
deleted file mode 100644
index f0089959e2078c121c14d02c46798e99bb2f5bc7..0000000000000000000000000000000000000000
--- a/myerrors_1553.out
+++ /dev/null
@@ -1,25 +0,0 @@
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 10677.82 examples/s]
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 131, in <module>
-    trainer.evaluate(max_length=max_length)
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 159, in evaluate
-    return super().evaluate(eval_dataset, ignore_keys=ignore_keys, metric_key_prefix=metric_key_prefix)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 2972, in evaluate
-    output = eval_loop(
-             ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 3161, in evaluation_loop
-    loss, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
-                           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 282, in prediction_step
-    generated_tokens = self.model.generate(**inputs, **gen_kwargs)
-                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 1402, in generate
-    self._validate_model_class()
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 1197, in _validate_model_class
-    raise TypeError(exception_message)
-TypeError: The current model class (BertModel) is not compatible with `.generate()`, as it doesn't have a language model head. Please use one of the following classes instead: {'BertLMHeadModel'}
diff --git a/myerrors_1554.out b/myerrors_1554.out
deleted file mode 100644
index 4c8a4883571c0064f7dd045ef0e867085b2f6fa5..0000000000000000000000000000000000000000
--- a/myerrors_1554.out
+++ /dev/null
@@ -1,165 +0,0 @@
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 13523.69 examples/s]
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [0,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [1,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [2,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [3,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [4,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [5,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [6,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [7,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [8,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [9,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [10,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [11,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [12,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [13,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [14,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [15,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [16,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [17,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [18,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [19,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [20,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [21,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [22,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [23,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [24,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [25,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [26,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [27,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [28,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [29,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [30,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [18,0,0], thread: [31,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [64,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [65,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [66,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [67,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [68,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [69,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [70,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [71,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [72,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [73,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [74,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [75,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [76,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [77,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [78,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [79,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [80,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [81,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [82,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [83,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [84,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [85,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [86,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [87,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [88,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [89,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [90,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [91,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [92,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [93,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [94,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [166,0,0], thread: [95,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 131, in <module>
-    trainer.evaluate(max_length=max_length)
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 159, in evaluate
-    return super().evaluate(eval_dataset, ignore_keys=ignore_keys, metric_key_prefix=metric_key_prefix)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 2972, in evaluate
-    output = eval_loop(
-             ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 3161, in evaluation_loop
-    loss, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
-                           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 282, in prediction_step
-    generated_tokens = self.model.generate(**inputs, **gen_kwargs)
-                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 1596, in generate
-    return self.greedy_search(
-           ^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 2444, in greedy_search
-    outputs = self(
-              ^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 1235, in forward
-    outputs = self.bert(
-              ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 1022, in forward
-    encoder_outputs = self.encoder(
-                      ^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 612, in forward
-    layer_outputs = layer_module(
-                    ^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 497, in forward
-    self_attention_outputs = self.attention(
-                             ^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 427, in forward
-    self_outputs = self.self(
-                   ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 286, in forward
-    mixed_query_layer = self.query(hidden_states)
-                        ^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/linear.py", line 114, in forward
-    return F.linear(input, self.weight, self.bias)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-RuntimeError: CUDA error: CUBLAS_STATUS_NOT_INITIALIZED when calling `cublasCreate(handle)`
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [96,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [97,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [98,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [99,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [100,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [101,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [102,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [103,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [104,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [105,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [106,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [107,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [108,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [109,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [110,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [111,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [112,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [113,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [114,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [115,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [116,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [117,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [118,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [119,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [120,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [121,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [122,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [123,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [124,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [125,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [126,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [161,0,0], thread: [127,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
diff --git a/myerrors_1555.out b/myerrors_1555.out
deleted file mode 100644
index 85e68c9fc635ed6872b05f9a4dbb9af44f37d515..0000000000000000000000000000000000000000
--- a/myerrors_1555.out
+++ /dev/null
@@ -1,46 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:32,  2.29s/it] 19%|█▉        | 3/16 [00:09<00:41,  3.19s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.66s/it] 31%|███▏      | 5/16 [00:17<00:43,  3.93s/it] 38%|███▊      | 6/16 [00:22<00:40,  4.10s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.21s/it] 50%|█████     | 8/16 [00:31<00:34,  4.28s/it] 56%|█████▋    | 9/16 [00:35<00:30,  4.33s/it] 62%|██████▎   | 10/16 [00:40<00:26,  4.36s/it] 69%|██████▉   | 11/16 [00:44<00:21,  4.38s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.39s/it] 81%|████████▏ | 13/16 [00:53<00:13,  4.41s/it] 88%|████████▊ | 14/16 [00:57<00:08,  4.41s/it] 94%|█████████▍| 15/16 [01:02<00:04,  4.42s/it]100%|██████████| 16/16 [01:05<00:00,  4.03s/it]100%|██████████| 16/16 [01:05<00:00,  4.11s/it]
-  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:37,  4.33it/s]  0%|          | 3/684 [00:00<01:15,  8.97it/s]  1%|          | 5/684 [00:00<01:02, 10.92it/s]  1%|          | 7/684 [00:00<00:56, 11.98it/s]  1%|▏         | 9/684 [00:00<00:53, 12.60it/s]  2%|▏         | 11/684 [00:00<00:51, 12.95it/s]  2%|▏         | 13/684 [00:01<00:50, 13.17it/s]  2%|▏         | 15/684 [00:01<00:50, 13.37it/s]  2%|▏         | 17/684 [00:01<00:49, 13.46it/s]  3%|▎         | 19/684 [00:01<00:49, 13.55it/s]  3%|▎         | 21/684 [00:01<00:48, 13.58it/s]  3%|▎         | 23/684 [00:01<00:48, 13.61it/s]  4%|▎         | 25/684 [00:01<00:48, 13.68it/s]  4%|▍         | 27/684 [00:02<00:48, 13.68it/s]  4%|▍         | 29/684 [00:02<00:47, 13.71it/s]  5%|▍         | 31/684 [00:02<00:47, 13.73it/s]  5%|▍         | 33/684 [00:02<00:47, 13.70it/s]  5%|▌         | 35/684 [00:02<00:47, 13.69it/s]  5%|▌         | 37/684 [00:02<00:47, 13.70it/s]  6%|▌         | 39/684 [00:02<00:47, 13.71it/s]  6%|▌         | 41/684 [00:03<00:46, 13.71it/s]  6%|▋         | 43/684 [00:03<00:46, 13.76it/s]  7%|▋         | 45/684 [00:03<00:46, 13.76it/s]  7%|▋         | 47/684 [00:03<00:46, 13.82it/s]  7%|▋         | 49/684 [00:03<00:45, 13.82it/s]  7%|▋         | 51/684 [00:03<00:45, 13.82it/s]  8%|▊         | 53/684 [00:04<00:45, 13.79it/s]  8%|▊         | 55/684 [00:04<00:45, 13.81it/s]  8%|▊         | 57/684 [00:04<00:45, 13.77it/s]  9%|▊         | 59/684 [00:04<00:45, 13.83it/s]  9%|▉         | 61/684 [00:04<00:44, 13.85it/s]  9%|▉         | 63/684 [00:04<00:44, 13.84it/s] 10%|▉         | 65/684 [00:04<00:44, 13.79it/s] 10%|▉         | 67/684 [00:05<00:44, 13.79it/s] 10%|█         | 69/684 [00:05<00:44, 13.77it/s] 10%|█         | 71/684 [00:05<00:44, 13.78it/s] 11%|█         | 73/684 [00:05<00:44, 13.78it/s] 11%|█         | 75/684 [00:05<00:44, 13.80it/s] 11%|█▏        | 77/684 [00:05<00:43, 13.81it/s] 12%|█▏        | 79/684 [00:05<00:43, 13.83it/s] 
12%|█▏        | 81/684 [00:06<00:43, 13.79it/s] 12%|█▏        | 83/684 [00:06<00:43, 13.86it/s] 12%|█▏        | 85/684 [00:06<00:43, 13.79it/s] 13%|█▎        | 87/684 [00:06<00:43, 13.75it/s] 13%|█▎        | 89/684 [00:06<00:43, 13.77it/s] 13%|█▎        | 91/684 [00:06<00:43, 13.74it/s] 14%|█▎        | 93/684 [00:06<00:42, 13.75it/s] 14%|█▍        | 95/684 [00:07<00:42, 13.76it/s] 14%|█▍        | 97/684 [00:07<00:42, 13.75it/s] 14%|█▍        | 99/684 [00:07<00:42, 13.70it/s] 15%|█▍        | 101/684 [00:07<00:42, 13.76it/s] 15%|█▌        | 103/684 [00:07<00:42, 13.68it/s] 15%|█▌        | 105/684 [00:07<00:42, 13.73it/s] 16%|█▌        | 107/684 [00:07<00:41, 13.75it/s] 16%|█▌        | 109/684 [00:08<00:41, 13.71it/s] 16%|█▌        | 111/684 [00:08<00:41, 13.74it/s] 17%|█▋        | 113/684 [00:08<00:41, 13.78it/s] 17%|█▋        | 115/684 [00:08<00:41, 13.80it/s] 17%|█▋        | 117/684 [00:08<00:41, 13.78it/s] 17%|█▋        | 119/684 [00:08<00:41, 13.75it/s] 18%|█▊        | 121/684 [00:08<00:40, 13.77it/s] 18%|█▊        | 123/684 [00:09<00:40, 13.78it/s] 18%|█▊        | 125/684 [00:09<00:40, 13.74it/s] 19%|█▊        | 127/684 [00:09<00:40, 13.77it/s] 19%|█▉        | 129/684 [00:09<00:40, 13.78it/s] 19%|█▉        | 131/684 [00:09<00:40, 13.78it/s] 19%|█▉        | 133/684 [00:09<00:39, 13.81it/s] 20%|█▉        | 135/684 [00:09<00:39, 13.78it/s] 20%|██        | 137/684 [00:10<00:39, 13.76it/s] 20%|██        | 139/684 [00:10<00:39, 13.75it/s] 21%|██        | 141/684 [00:10<00:39, 13.76it/s] 21%|██        | 143/684 [00:10<00:39, 13.72it/s] 21%|██        | 145/684 [00:10<00:39, 13.74it/s] 21%|██▏       | 147/684 [00:10<00:39, 13.75it/s] 22%|██▏       | 149/684 [00:10<00:38, 13.76it/s] 22%|██▏       | 151/684 [00:11<00:38, 13.75it/s] 22%|██▏       | 153/684 [00:11<00:38, 13.70it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.76it/s] 23%|██▎       | 157/684 [00:11<00:38, 13.78it/s] 23%|██▎       | 159/684 [00:11<00:38, 13.79it/s] 24%|██▎   
    | 161/684 [00:11<00:38, 13.75it/s] 24%|██▍       | 163/684 [00:11<00:37, 13.78it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.76it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.78it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.82it/s] 25%|██▌       | 171/684 [00:12<00:37, 13.82it/s] 25%|██▌       | 173/684 [00:12<00:37, 13.74it/s] 26%|██▌       | 175/684 [00:12<00:37, 13.74it/s] 26%|██▌       | 177/684 [00:13<00:36, 13.76it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.76it/s] 26%|██▋       | 181/684 [00:13<00:36, 13.79it/s] 27%|██▋       | 183/684 [00:13<00:36, 13.79it/s] 27%|██▋       | 185/684 [00:13<00:36, 13.74it/s] 27%|██▋       | 187/684 [00:13<00:36, 13.71it/s] 28%|██▊       | 189/684 [00:13<00:36, 13.68it/s] 28%|██▊       | 191/684 [00:14<00:35, 13.71it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.73it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.76it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.76it/s] 29%|██▉       | 199/684 [00:14<00:35, 13.76it/s] 29%|██▉       | 201/684 [00:14<00:35, 13.75it/s] 30%|██▉       | 203/684 [00:14<00:34, 13.76it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.77it/s] 30%|███       | 207/684 [00:15<00:34, 13.77it/s] 31%|███       | 209/684 [00:15<00:34, 13.75it/s] 31%|███       | 211/684 [00:15<00:34, 13.78it/s] 31%|███       | 213/684 [00:15<00:34, 13.79it/s] 31%|███▏      | 215/684 [00:15<00:34, 13.76it/s] 32%|███▏      | 217/684 [00:15<00:33, 13.79it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.78it/s] 32%|███▏      | 221/684 [00:16<00:33, 13.76it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.74it/s] 33%|███▎      | 225/684 [00:16<00:33, 13.76it/s] 33%|███▎      | 227/684 [00:16<00:33, 13.71it/s] 33%|███▎      | 229/684 [00:18<02:47,  2.72it/s] 34%|███▍      | 231/684 [00:18<02:05,  3.60it/s] 34%|███▍      | 233/684 [00:19<01:36,  4.68it/s] 34%|███▍      | 235/684 [00:19<01:15,  5.94it/s] 35%|███▍      | 237/684 [00:19<01:01,  7.28it/s] 35%|███▍      | 239/684 [00:19<00:52,  8.41it/s] 35%|███▌  
    | 241/684 [00:19<00:48,  9.21it/s] 36%|███▌      | 243/684 [00:19<00:43, 10.20it/s] 36%|███▌      | 245/684 [00:19<00:41, 10.62it/s] 36%|███▌      | 247/684 [00:20<00:38, 11.40it/s] 36%|███▋      | 249/684 [00:20<00:37, 11.67it/s] 37%|███▋      | 251/684 [00:20<00:36, 12.03it/s] 37%|███▋      | 253/684 [00:20<00:35, 12.23it/s] 37%|███▋      | 255/684 [00:20<00:34, 12.34it/s] 38%|███▊      | 257/684 [00:20<00:33, 12.58it/s] 38%|███▊      | 259/684 [00:21<00:34, 12.42it/s] 38%|███▊      | 261/684 [00:21<00:33, 12.70it/s] 38%|███▊      | 263/684 [00:21<00:33, 12.51it/s] 39%|███▊      | 265/684 [00:21<00:33, 12.56it/s] 39%|███▉      | 267/684 [00:21<00:32, 12.69it/s] 39%|███▉      | 269/684 [00:21<00:33, 12.52it/s] 40%|███▉      | 271/684 [00:21<00:32, 12.82it/s] 40%|███▉      | 273/684 [00:22<00:32, 12.64it/s] 40%|████      | 275/684 [00:22<00:32, 12.76it/s] 40%|████      | 277/684 [00:22<00:31, 12.84it/s] 41%|████      | 279/684 [00:22<00:31, 12.73it/s] 41%|████      | 281/684 [00:22<00:31, 12.92it/s] 41%|████▏     | 283/684 [00:22<00:31, 12.74it/s] 42%|████▏     | 285/684 [00:23<00:31, 12.54it/s] 42%|████▏     | 287/684 [00:23<00:30, 12.95it/s] 42%|████▏     | 289/684 [00:23<00:30, 12.77it/s] 43%|████▎     | 291/684 [00:23<00:29, 13.11it/s] 43%|████▎     | 293/684 [00:23<00:30, 12.92it/s] 43%|████▎     | 295/684 [00:23<00:30, 12.73it/s] 43%|████▎     | 297/684 [00:23<00:30, 12.69it/s] 44%|████▎     | 299/684 [00:24<00:29, 13.13it/s] 44%|████▍     | 301/684 [00:24<00:28, 13.28it/s] 44%|████▍     | 303/684 [00:24<00:28, 13.42it/s] 45%|████▍     | 305/684 [00:24<00:29, 12.88it/s] 45%|████▍     | 307/684 [00:24<00:29, 12.74it/s] 45%|████▌     | 309/684 [00:24<00:28, 12.93it/s] 45%|████▌     | 311/684 [00:25<00:29, 12.72it/s] 46%|████▌     | 313/684 [00:25<00:28, 13.16it/s] 46%|████▌     | 315/684 [00:25<00:28, 13.01it/s] 46%|████▋     | 317/684 [00:25<00:28, 13.02it/s] 47%|████▋     | 319/684 [00:25<00:27, 13.24it/s] 47%|████▋ 
    | 321/684 [00:25<00:26, 13.54it/s] 47%|████▋     | 323/684 [00:25<00:26, 13.63it/s] 48%|████▊     | 325/684 [00:26<00:26, 13.68it/s] 48%|████▊     | 327/684 [00:26<00:26, 13.68it/s] 48%|████▊     | 329/684 [00:26<00:25, 13.69it/s] 48%|████▊     | 331/684 [00:26<00:25, 13.76it/s] 49%|████▊     | 333/684 [00:26<00:25, 13.78it/s] 49%|████▉     | 335/684 [00:26<00:25, 13.75it/s] 49%|████▉     | 337/684 [00:26<00:25, 13.76it/s] 50%|████▉     | 339/684 [00:27<00:25, 13.79it/s] 50%|████▉     | 341/684 [00:27<00:24, 13.75it/s] 50%|█████     | 343/684 [00:27<00:24, 13.70it/s] 50%|█████     | 345/684 [00:27<00:24, 13.81it/s] 51%|█████     | 347/684 [00:27<00:24, 13.84it/s] 51%|█████     | 349/684 [00:27<00:24, 13.83it/s] 51%|█████▏    | 351/684 [00:27<00:24, 13.77it/s] 52%|█████▏    | 353/684 [00:28<00:24, 13.70it/s] 52%|█████▏    | 355/684 [00:28<00:23, 13.74it/s] 52%|█████▏    | 357/684 [00:28<00:23, 13.77it/s] 52%|█████▏    | 359/684 [00:28<00:23, 13.76it/s] 53%|█████▎    | 361/684 [00:28<00:23, 13.77it/s] 53%|█████▎    | 363/684 [00:28<00:23, 13.75it/s] 53%|█████▎    | 365/684 [00:28<00:23, 13.73it/s] 54%|█████▎    | 367/684 [00:29<00:23, 13.74it/s] 54%|█████▍    | 369/684 [00:29<00:22, 13.81it/s] 54%|█████▍    | 371/684 [00:29<00:22, 13.83it/s] 55%|█████▍    | 373/684 [00:29<00:22, 13.83it/s] 55%|█████▍    | 375/684 [00:29<00:22, 13.84it/s] 55%|█████▌    | 377/684 [00:29<00:22, 13.82it/s] 55%|█████▌    | 379/684 [00:30<00:22, 13.81it/s] 56%|█████▌    | 381/684 [00:30<00:21, 13.80it/s] 56%|█████▌    | 383/684 [00:30<00:21, 13.76it/s] 56%|█████▋    | 385/684 [00:30<00:21, 13.79it/s] 57%|█████▋    | 387/684 [00:30<00:21, 13.82it/s] 57%|█████▋    | 389/684 [00:30<00:21, 13.75it/s] 57%|█████▋    | 391/684 [00:30<00:21, 13.73it/s] 57%|█████▋    | 393/684 [00:31<00:21, 13.75it/s] 58%|█████▊    | 395/684 [00:31<00:21, 13.75it/s] 58%|█████▊    | 397/684 [00:31<00:20, 13.72it/s] 58%|█████▊    | 399/684 [00:31<00:20, 13.76it/s] 
59%|█████▊    | 401/684 [00:31<00:20, 13.78it/s] 59%|█████▉    | 403/684 [00:31<00:20, 13.75it/s] 59%|█████▉    | 405/684 [00:31<00:20, 13.77it/s] 60%|█████▉    | 407/684 [00:32<00:20, 13.72it/s] 60%|█████▉    | 409/684 [00:32<00:20, 13.73it/s] 60%|██████    | 411/684 [00:32<00:19, 13.76it/s] 60%|██████    | 413/684 [00:32<00:19, 13.77it/s] 61%|██████    | 415/684 [00:32<00:19, 13.75it/s] 61%|██████    | 417/684 [00:32<00:19, 13.70it/s] 61%|██████▏   | 419/684 [00:32<00:19, 13.68it/s] 62%|██████▏   | 421/684 [00:33<00:19, 13.69it/s] 62%|██████▏   | 423/684 [00:33<00:19, 13.70it/s] 62%|██████▏   | 425/684 [00:33<00:18, 13.70it/s] 62%|██████▏   | 427/684 [00:33<00:18, 13.72it/s] 63%|██████▎   | 429/684 [00:33<00:18, 13.76it/s] 63%|██████▎   | 431/684 [00:33<00:18, 13.75it/s] 63%|██████▎   | 433/684 [00:33<00:18, 13.77it/s] 64%|██████▎   | 435/684 [00:34<00:18, 13.78it/s] 64%|██████▍   | 437/684 [00:34<00:17, 13.76it/s] 64%|██████▍   | 439/684 [00:34<00:17, 13.79it/s] 64%|██████▍   | 441/684 [00:34<00:17, 13.81it/s] 65%|██████▍   | 443/684 [00:34<00:17, 13.77it/s] 65%|██████▌   | 445/684 [00:34<00:17, 13.76it/s] 65%|██████▌   | 447/684 [00:34<00:17, 13.76it/s] 66%|██████▌   | 449/684 [00:35<00:17, 13.81it/s] 66%|██████▌   | 451/684 [00:35<00:16, 13.74it/s] 66%|██████▌   | 453/684 [00:35<00:16, 13.70it/s] 67%|██████▋   | 455/684 [00:35<00:16, 13.77it/s] 67%|██████▋   | 457/684 [00:37<01:18,  2.91it/s] 67%|██████▋   | 459/684 [00:37<00:59,  3.81it/s] 67%|██████▋   | 461/684 [00:37<00:45,  4.86it/s] 68%|██████▊   | 463/684 [00:37<00:36,  6.03it/s] 68%|██████▊   | 465/684 [00:38<00:30,  7.19it/s] 68%|██████▊   | 467/684 [00:38<00:26,  8.30it/s] 69%|██████▊   | 469/684 [00:38<00:23,  9.33it/s] 69%|██████▉   | 471/684 [00:38<00:20, 10.20it/s] 69%|██████▉   | 473/684 [00:38<00:19, 10.85it/s] 69%|██████▉   | 475/684 [00:38<00:18, 11.50it/s] 70%|██████▉   | 477/684 [00:38<00:17, 11.93it/s] 70%|███████   | 479/684 [00:39<00:17, 12.05it/s] 
70%|███████   | 481/684 [00:39<00:16, 12.55it/s] 71%|███████   | 483/684 [00:39<00:16, 12.36it/s] 71%|███████   | 485/684 [00:39<00:15, 12.48it/s] 71%|███████   | 487/684 [00:39<00:15, 12.49it/s] 71%|███████▏  | 489/684 [00:39<00:15, 12.58it/s] 72%|███████▏  | 491/684 [00:40<00:15, 12.70it/s] 72%|███████▏  | 493/684 [00:40<00:15, 12.71it/s] 72%|███████▏  | 495/684 [00:40<00:14, 12.78it/s] 73%|███████▎  | 497/684 [00:40<00:14, 12.88it/s] 73%|███████▎  | 499/684 [00:40<00:14, 12.73it/s]                                                  73%|███████▎  | 500/684 [00:40<00:14, 12.73it/s] 73%|███████▎  | 501/684 [00:40<00:13, 13.09it/s] 74%|███████▎  | 503/684 [00:41<00:14, 12.87it/s] 74%|███████▍  | 505/684 [00:41<00:13, 13.08it/s] 74%|███████▍  | 507/684 [00:41<00:13, 12.80it/s] 74%|███████▍  | 509/684 [00:41<00:13, 13.04it/s] 75%|███████▍  | 511/684 [00:41<00:13, 13.29it/s] 75%|███████▌  | 513/684 [00:41<00:13, 12.89it/s] 75%|███████▌  | 515/684 [00:41<00:12, 13.03it/s] 76%|███████▌  | 517/684 [00:42<00:13, 12.60it/s] 76%|███████▌  | 519/684 [00:42<00:12, 12.92it/s] 76%|███████▌  | 521/684 [00:42<00:12, 12.60it/s] 76%|███████▋  | 523/684 [00:42<00:12, 12.93it/s] 77%|███████▋  | 525/684 [00:42<00:12, 12.59it/s] 77%|███████▋  | 527/684 [00:42<00:12, 12.98it/s] 77%|███████▋  | 529/684 [00:43<00:12, 12.60it/s] 78%|███████▊  | 531/684 [00:43<00:11, 12.99it/s] 78%|███████▊  | 533/684 [00:43<00:11, 12.59it/s] 78%|███████▊  | 535/684 [00:43<00:11, 12.73it/s] 79%|███████▊  | 537/684 [00:43<00:11, 12.56it/s] 79%|███████▉  | 539/684 [00:43<00:11, 12.79it/s] 79%|███████▉  | 541/684 [00:44<00:11, 12.49it/s] 79%|███████▉  | 543/684 [00:44<00:11, 12.65it/s] 80%|███████▉  | 545/684 [00:44<00:10, 12.80it/s] 80%|███████▉  | 547/684 [00:44<00:10, 12.86it/s] 80%|████████  | 549/684 [00:44<00:10, 13.07it/s] 81%|████████  | 551/684 [00:44<00:10, 13.23it/s] 81%|████████  | 553/684 [00:44<00:09, 13.39it/s] 81%|████████  | 555/684 [00:45<00:09, 13.56it/s]
 81%|████████▏ | 557/684 [00:45<00:09, 13.64it/s] 82%|████████▏ | 559/684 [00:45<00:09, 13.67it/s] 82%|████████▏ | 561/684 [00:45<00:08, 13.70it/s] 82%|████████▏ | 563/684 [00:45<00:08, 13.78it/s] 83%|████████▎ | 565/684 [00:45<00:08, 13.78it/s] 83%|████████▎ | 567/684 [00:45<00:08, 13.67it/s] 83%|████████▎ | 569/684 [00:46<00:08, 13.68it/s] 83%|████████▎ | 571/684 [00:46<00:08, 13.72it/s] 84%|████████▍ | 573/684 [00:46<00:08, 13.73it/s] 84%|████████▍ | 575/684 [00:46<00:07, 13.76it/s] 84%|████████▍ | 577/684 [00:46<00:07, 13.73it/s] 85%|████████▍ | 579/684 [00:46<00:07, 13.74it/s] 85%|████████▍ | 581/684 [00:46<00:07, 13.78it/s] 85%|████████▌ | 583/684 [00:47<00:07, 13.78it/s] 86%|████████▌ | 585/684 [00:47<00:07, 13.77it/s] 86%|████████▌ | 587/684 [00:47<00:07, 13.70it/s] 86%|████████▌ | 589/684 [00:47<00:06, 13.74it/s] 86%|████████▋ | 591/684 [00:47<00:06, 13.73it/s] 87%|████████▋ | 593/684 [00:47<00:06, 13.75it/s] 87%|████████▋ | 595/684 [00:47<00:06, 13.75it/s] 87%|████████▋ | 597/684 [00:48<00:06, 13.75it/s] 88%|████████▊ | 599/684 [00:48<00:06, 13.74it/s] 88%|████████▊ | 601/684 [00:48<00:06, 13.75it/s] 88%|████████▊ | 603/684 [00:48<00:05, 13.75it/s] 88%|████████▊ | 605/684 [00:48<00:05, 13.72it/s] 89%|████████▊ | 607/684 [00:48<00:05, 13.73it/s] 89%|████████▉ | 609/684 [00:48<00:05, 13.74it/s] 89%|████████▉ | 611/684 [00:49<00:05, 13.70it/s] 90%|████████▉ | 613/684 [00:49<00:05, 13.71it/s] 90%|████████▉ | 615/684 [00:49<00:05, 13.70it/s] 90%|█████████ | 617/684 [00:49<00:04, 13.73it/s] 90%|█████████ | 619/684 [00:49<00:04, 13.71it/s] 91%|█████████ | 621/684 [00:49<00:04, 13.67it/s] 91%|█████████ | 623/684 [00:49<00:04, 13.70it/s] 91%|█████████▏| 625/684 [00:50<00:04, 13.70it/s] 92%|█████████▏| 627/684 [00:50<00:04, 13.73it/s] 92%|█████████▏| 629/684 [00:50<00:04, 13.72it/s] 92%|█████████▏| 631/684 [00:50<00:03, 13.71it/s] 93%|█████████▎| 633/684 [00:50<00:03, 13.75it/s] 93%|█████████▎| 635/684 [00:50<00:03, 13.75it/s]
 93%|█████████▎| 637/684 [00:51<00:03, 13.78it/s] 93%|█████████▎| 639/684 [00:51<00:03, 13.74it/s] 94%|█████████▎| 641/684 [00:51<00:03, 13.81it/s] 94%|█████████▍| 643/684 [00:51<00:02, 13.77it/s] 94%|█████████▍| 645/684 [00:51<00:02, 13.75it/s] 95%|█████████▍| 647/684 [00:51<00:02, 13.77it/s] 95%|█████████▍| 649/684 [00:51<00:02, 13.76it/s] 95%|█████████▌| 651/684 [00:52<00:02, 13.76it/s] 95%|█████████▌| 653/684 [00:52<00:02, 13.74it/s] 96%|█████████▌| 655/684 [00:52<00:02, 13.80it/s] 96%|█████████▌| 657/684 [00:52<00:01, 13.76it/s] 96%|█████████▋| 659/684 [00:52<00:01, 13.79it/s] 97%|█████████▋| 661/684 [00:52<00:01, 13.75it/s] 97%|█████████▋| 663/684 [00:52<00:01, 13.73it/s] 97%|█████████▋| 665/684 [00:53<00:01, 13.81it/s] 98%|█████████▊| 667/684 [00:53<00:01, 13.73it/s] 98%|█████████▊| 669/684 [00:53<00:01, 13.74it/s] 98%|█████████▊| 671/684 [00:53<00:00, 13.75it/s] 98%|█████████▊| 673/684 [00:53<00:00, 13.75it/s] 99%|█████████▊| 675/684 [00:53<00:00, 13.71it/s] 99%|█████████▉| 677/684 [00:53<00:00, 13.75it/s] 99%|█████████▉| 679/684 [00:54<00:00, 13.77it/s]100%|█████████▉| 681/684 [00:54<00:00, 13.77it/s]100%|█████████▉| 683/684 [00:54<00:00, 13.75it/s]                                                 100%|██████████| 684/684 [00:56<00:00, 13.75it/s]100%|██████████| 684/684 [00:56<00:00, 12.13it/s]
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:31,  2.23s/it] 19%|█▉        | 3/16 [00:08<00:41,  3.16s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.65s/it] 31%|███▏      | 5/16 [00:17<00:43,  3.93s/it] 38%|███▊      | 6/16 [00:22<00:41,  4.11s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.22s/it] 50%|█████     | 8/16 [00:31<00:34,  4.29s/it] 56%|█████▋    | 9/16 [00:35<00:30,  4.34s/it] 62%|██████▎   | 10/16 [00:40<00:26,  4.38s/it] 69%|██████▉   | 11/16 [00:44<00:22,  4.41s/it] 75%|███████▌  | 12/16 [00:49<00:17,  4.42s/it] 81%|████████▏ | 13/16 [00:53<00:13,  4.43s/it] 88%|████████▊ | 14/16 [00:58<00:08,  4.45s/it] 94%|█████████▍| 15/16 [01:02<00:04,  4.45s/it]100%|██████████| 16/16 [01:05<00:00,  4.06s/it]100%|██████████| 16/16 [01:05<00:00,  4.12s/it]
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_errors.py", line 261, in hf_raise_for_status
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/requests/models.py", line 1021, in raise_for_status
-    raise HTTPError(http_error_msg, response=self)
-requests.exceptions.HTTPError: 404 Client Error: Not Found for url: https://huggingface.co/aatherton2024/eng-nah-svo-cpt/resolve/main/config.json
-
-The above exception was the direct cause of the following exception:
-
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 428, in cached_file
-    resolved_file = hf_hub_download(
-                    ^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1230, in hf_hub_download
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1606, in get_hf_file_metadata
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_errors.py", line 271, in hf_raise_for_status
-huggingface_hub.utils._errors.EntryNotFoundError: 404 Client Error. (Request ID: Root=1-650786ae-6603d136738db081161c4861;1f95ec5e-e41f-4227-9312-c914e4df78c5)
-
-Entry Not Found for url: https://huggingface.co/aatherton2024/eng-nah-svo-cpt/resolve/main/config.json.
-
-The above exception was the direct cause of the following exception:
-
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 152, in <module>
-    model = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint)
-            ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/auto_factory.py", line 482, in from_pretrained
-    config, kwargs = AutoConfig.from_pretrained(
-                     ^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/configuration_auto.py", line 1007, in from_pretrained
-    config_dict, unused_kwargs = PretrainedConfig.get_config_dict(pretrained_model_name_or_path, **kwargs)
-                                 ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/configuration_utils.py", line 620, in get_config_dict
-    config_dict, kwargs = cls._get_config_dict(pretrained_model_name_or_path, **kwargs)
-                          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/configuration_utils.py", line 675, in _get_config_dict
-    resolved_config_file = cached_file(
-                           ^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 479, in cached_file
-    raise EnvironmentError(
-OSError: aatherton2024/eng-nah-svo-cpt does not appear to have a file named config.json. Checkout 'https://huggingface.co/aatherton2024/eng-nah-svo-cpt/main' for available files.
diff --git a/myerrors_1556.out b/myerrors_1556.out
deleted file mode 100644
index a2a0dbf83f155ceaa5d8b2e02eee98ac9c32aab9..0000000000000000000000000000000000000000
--- a/myerrors_1556.out
+++ /dev/null
@@ -1,22 +0,0 @@
-Map:   0%|          | 0/7292 [00:00<?, ? examples/s]Map:  27%|██▋       | 2000/7292 [00:00<00:00, 8595.22 examples/s]Map:  82%|████████▏ | 6000/7292 [00:00<00:00, 18512.49 examples/s]Map: 100%|██████████| 7292/7292 [00:00<00:00, 18090.23 examples/s]
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 31688.93 examples/s]
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 30340.57 examples/s]
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 72, in <module>
-    model = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint)
-            ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/auto_factory.py", line 482, in from_pretrained
-    config, kwargs = AutoConfig.from_pretrained(
-                     ^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/configuration_auto.py", line 1007, in from_pretrained
-    config_dict, unused_kwargs = PretrainedConfig.get_config_dict(pretrained_model_name_or_path, **kwargs)
-                                 ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/configuration_utils.py", line 620, in get_config_dict
-    config_dict, kwargs = cls._get_config_dict(pretrained_model_name_or_path, **kwargs)
-                          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/configuration_utils.py", line 675, in _get_config_dict
-    resolved_config_file = cached_file(
-                           ^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 399, in cached_file
-    raise EnvironmentError(
-OSError: eng-nah-svo-cpt does not appear to have a file named config.json. Checkout 'https://huggingface.co/eng-nah-svo-cpt/None' for available files.
diff --git a/myerrors_1557.out b/myerrors_1557.out
deleted file mode 100644
index c521abbc5051a589ac5f4c325089c8f44a320fe2..0000000000000000000000000000000000000000
--- a/myerrors_1557.out
+++ /dev/null
@@ -1,40 +0,0 @@
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_errors.py", line 261, in hf_raise_for_status
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/requests/models.py", line 1021, in raise_for_status
-    raise HTTPError(http_error_msg, response=self)
-requests.exceptions.HTTPError: 404 Client Error: Not Found for url: https://huggingface.co/eng-nah-svo-cpt/resolve/main/tokenizer_config.json
-
-The above exception was the direct cause of the following exception:
-
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 428, in cached_file
-    resolved_file = hf_hub_download(
-                    ^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1344, in hf_hub_download
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1230, in hf_hub_download
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1606, in get_hf_file_metadata
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_errors.py", line 293, in hf_raise_for_status
-huggingface_hub.utils._errors.RepositoryNotFoundError: 404 Client Error. (Request ID: Root=1-65078ad3-69f0105f790b8b472eceb3d6;305708a1-7612-4fce-92cd-fb302d6700cd)
-
-Repository Not Found for url: https://huggingface.co/eng-nah-svo-cpt/resolve/main/tokenizer_config.json.
-Please make sure you specified the correct `repo_id` and `repo_type`.
-If you are trying to access a private or gated repo, make sure you are authenticated.
-
-The above exception was the direct cause of the following exception:
-
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 40, in <module>
-    tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
-                ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/tokenization_auto.py", line 677, in from_pretrained
-    tokenizer_config = get_tokenizer_config(pretrained_model_name_or_path, **kwargs)
-                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/tokenization_auto.py", line 510, in get_tokenizer_config
-    resolved_config_file = cached_file(
-                           ^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 449, in cached_file
-    raise EnvironmentError(
-OSError: eng-nah-svo-cpt is not a local folder and is not a valid model identifier listed on 'https://huggingface.co/models'
-If this is a private repository, make sure to pass a token having permission to this repo either by logging in with `huggingface-cli login` or by passing `token=<your_token>`
diff --git a/myerrors_1558.out b/myerrors_1558.out
deleted file mode 100644
index ab4f661fb27c4a7ed0f771d2bb1c996028dd1f35..0000000000000000000000000000000000000000
--- a/myerrors_1558.out
+++ /dev/null
@@ -1,101 +0,0 @@
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 20217.07 examples/s]
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [0,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [1,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [2,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [3,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [4,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [5,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [6,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [7,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [8,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [9,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [10,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [11,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [12,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [13,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [14,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [15,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [16,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [17,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [18,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [19,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [20,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [21,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [22,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [23,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [24,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [25,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [26,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [27,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [28,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [29,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [30,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-/opt/conda/conda-bld/pytorch_1682343995622/work/aten/src/ATen/native/cuda/Indexing.cu:1146: indexSelectLargeIndex: block: [237,0,0], thread: [31,0,0] Assertion `srcIndex < srcSelectDimSize` failed.
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 132, in <module>
-    trainer.evaluate(max_length=max_length)
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 159, in evaluate
-    return super().evaluate(eval_dataset, ignore_keys=ignore_keys, metric_key_prefix=metric_key_prefix)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 2972, in evaluate
-    output = eval_loop(
-             ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer.py", line 3161, in evaluation_loop
-    loss, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
-                           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/trainer_seq2seq.py", line 282, in prediction_step
-    generated_tokens = self.model.generate(**inputs, **gen_kwargs)
-                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 1596, in generate
-    return self.greedy_search(
-           ^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/generation/utils.py", line 2444, in greedy_search
-    outputs = self(
-              ^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 1235, in forward
-    outputs = self.bert(
-              ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 1022, in forward
-    encoder_outputs = self.encoder(
-                      ^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 612, in forward
-    layer_outputs = layer_module(
-                    ^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 497, in forward
-    self_attention_outputs = self.attention(
-                             ^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 427, in forward
-    self_outputs = self.self(
-                   ^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/bert/modeling_bert.py", line 286, in forward
-    mixed_query_layer = self.query(hidden_states)
-                        ^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl
-    return forward_call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/nn/modules/linear.py", line 114, in forward
-    return F.linear(input, self.weight, self.bias)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-RuntimeError: CUDA error: CUBLAS_STATUS_NOT_INITIALIZED when calling `cublasCreate(handle)`
diff --git a/myerrors_1559.out b/myerrors_1559.out
deleted file mode 100644
index ee64d0e7b9593bf5b85acf9fa09650cd78c5d49b..0000000000000000000000000000000000000000
--- a/myerrors_1559.out
+++ /dev/null
@@ -1,3 +0,0 @@
-Map:   0%|          | 0/1001 [00:00<?, ? examples/s]Map: 100%|██████████| 1001/1001 [00:00<00:00, 15843.57 examples/s]
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.17s/it] 19%|█▉        | 3/16 [00:08<00:39,  3.07s/it]slurmstepd-dl: error: *** JOB 1559 ON dl CANCELLED AT 2023-09-17T19:27:45 ***
diff --git a/myerrors_1560.out b/myerrors_1560.out
deleted file mode 100644
index 4d8f3d524e44a9718c338e0b0a80df3949b30d1d..0000000000000000000000000000000000000000
--- a/myerrors_1560.out
+++ /dev/null
@@ -1,2 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:31,  2.27s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.15s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.60s/it]slurmstepd-dl: error: *** JOB 1560 ON dl CANCELLED AT 2023-09-17T19:31:19 ***
diff --git a/myerrors_1561.out b/myerrors_1561.out
deleted file mode 100644
index 1ede688aefde0bc081e2d0c624f5bb8ee686bc43..0000000000000000000000000000000000000000
--- a/myerrors_1561.out
+++ /dev/null
@@ -1,161 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:31,  2.23s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.14s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.62s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.87s/it] 38%|███▊      | 6/16 [00:21<00:40,  4.03s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.13s/it] 50%|█████     | 8/16 [00:30<00:33,  4.20s/it] 56%|█████▋    | 9/16 [00:35<00:29,  4.24s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.29s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.31s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.32s/it] 81%|████████▏ | 13/16 [00:52<00:12,  4.33s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.33s/it] 94%|█████████▍| 15/16 [01:01<00:04,  4.34s/it]100%|██████████| 16/16 [01:04<00:00,  3.96s/it]100%|██████████| 16/16 [01:04<00:00,  4.03s/it]
-  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:36,  4.35it/s]  0%|          | 3/684 [00:00<01:15,  9.01it/s]  1%|          | 5/684 [00:00<01:02, 10.94it/s]  1%|          | 7/684 [00:00<00:56, 12.01it/s]  1%|▏         | 9/684 [00:00<00:53, 12.63it/s]  2%|▏         | 11/684 [00:00<00:51, 13.00it/s]  2%|▏         | 13/684 [00:01<00:50, 13.29it/s]  2%|▏         | 15/684 [00:01<00:49, 13.50it/s]  2%|▏         | 17/684 [00:01<00:49, 13.57it/s]  3%|▎         | 19/684 [00:01<00:49, 13.57it/s]  3%|▎         | 21/684 [00:01<00:48, 13.63it/s]  3%|▎         | 23/684 [00:01<00:48, 13.61it/s]  4%|▎         | 25/684 [00:01<00:48, 13.70it/s]  4%|▍         | 27/684 [00:02<00:48, 13.68it/s]  4%|▍         | 29/684 [00:02<00:47, 13.73it/s]  5%|▍         | 31/684 [00:02<00:47, 13.70it/s]  5%|▍         | 33/684 [00:02<00:47, 13.70it/s]  5%|▌         | 35/684 [00:02<00:47, 13.74it/s]  5%|▌         | 37/684 [00:02<00:47, 13.71it/s]  6%|▌         | 39/684 [00:02<00:47, 13.71it/s]  6%|▌         | 41/684 [00:03<00:46, 13.75it/s]  6%|▋         | 43/684 [00:03<00:46, 13.73it/s]  7%|▋         | 45/684 [00:03<00:46, 13.73it/s]  7%|▋         | 47/684 [00:03<00:46, 13.74it/s]  7%|▋         | 49/684 [00:03<00:46, 13.77it/s]  7%|▋         | 51/684 [00:03<00:45, 13.77it/s]  8%|▊         | 53/684 [00:04<00:45, 13.76it/s]  8%|▊         | 55/684 [00:04<00:45, 13.76it/s]  8%|▊         | 57/684 [00:04<00:45, 13.72it/s]  9%|▊         | 59/684 [00:04<00:45, 13.69it/s]  9%|▉         | 61/684 [00:04<00:45, 13.70it/s]  9%|▉         | 63/684 [00:04<00:45, 13.70it/s] 10%|▉         | 65/684 [00:04<00:45, 13.74it/s] 10%|▉         | 67/684 [00:05<00:44, 13.71it/s] 10%|█         | 69/684 [00:05<00:44, 13.71it/s] 10%|█         | 71/684 [00:05<00:44, 13.69it/s] 11%|█         | 73/684 [00:05<00:44, 13.65it/s] 11%|█         | 75/684 [00:05<00:44, 13.70it/s] 11%|█▏        | 77/684 [00:05<00:44, 13.71it/s] 12%|█▏        | 79/684 [00:05<00:43, 13.75it/s] 
12%|█▏        | 81/684 [00:06<00:43, 13.71it/s] 12%|█▏        | 83/684 [00:06<00:43, 13.76it/s] 12%|█▏        | 85/684 [00:06<00:43, 13.79it/s] 13%|█▎        | 87/684 [00:06<00:43, 13.75it/s] 13%|█▎        | 89/684 [00:06<00:43, 13.75it/s] 13%|█▎        | 91/684 [00:06<00:43, 13.79it/s] 14%|█▎        | 93/684 [00:06<00:43, 13.72it/s] 14%|█▍        | 95/684 [00:07<00:42, 13.77it/s] 14%|█▍        | 97/684 [00:07<00:42, 13.68it/s] 14%|█▍        | 99/684 [00:07<00:42, 13.73it/s] 15%|█▍        | 101/684 [00:07<00:42, 13.73it/s] 15%|█▌        | 103/684 [00:07<00:42, 13.73it/s] 15%|█▌        | 105/684 [00:07<00:42, 13.76it/s] 16%|█▌        | 107/684 [00:07<00:41, 13.76it/s] 16%|█▌        | 109/684 [00:08<00:41, 13.74it/s] 16%|█▌        | 111/684 [00:08<00:42, 13.58it/s] 17%|█▋        | 113/684 [00:08<00:41, 13.75it/s] 17%|█▋        | 115/684 [00:08<00:41, 13.78it/s] 17%|█▋        | 117/684 [00:08<00:41, 13.76it/s] 17%|█▋        | 119/684 [00:08<00:41, 13.75it/s] 18%|█▊        | 121/684 [00:08<00:41, 13.72it/s] 18%|█▊        | 123/684 [00:09<00:40, 13.76it/s] 18%|█▊        | 125/684 [00:09<00:40, 13.76it/s] 19%|█▊        | 127/684 [00:09<00:40, 13.75it/s] 19%|█▉        | 129/684 [00:09<00:40, 13.71it/s] 19%|█▉        | 131/684 [00:09<00:40, 13.80it/s] 19%|█▉        | 133/684 [00:09<00:39, 13.78it/s] 20%|█▉        | 135/684 [00:09<00:39, 13.76it/s] 20%|██        | 137/684 [00:10<00:39, 13.69it/s] 20%|██        | 139/684 [00:10<00:39, 13.73it/s] 21%|██        | 141/684 [00:10<00:39, 13.74it/s] 21%|██        | 143/684 [00:10<00:39, 13.68it/s] 21%|██        | 145/684 [00:10<00:39, 13.72it/s] 21%|██▏       | 147/684 [00:10<00:39, 13.68it/s] 22%|██▏       | 149/684 [00:10<00:38, 13.74it/s] 22%|██▏       | 151/684 [00:11<00:38, 13.74it/s] 22%|██▏       | 153/684 [00:11<00:38, 13.77it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.72it/s] 23%|██▎       | 157/684 [00:11<00:38, 13.74it/s] 23%|██▎       | 159/684 [00:11<00:38, 13.75it/s] 24%|██▎   
    | 161/684 [00:11<00:37, 13.77it/s] 24%|██▍       | 163/684 [00:12<00:37, 13.74it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.77it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.77it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.78it/s] 25%|██▌       | 171/684 [00:12<00:37, 13.80it/s] 25%|██▌       | 173/684 [00:12<00:37, 13.76it/s] 26%|██▌       | 175/684 [00:12<00:36, 13.78it/s] 26%|██▌       | 177/684 [00:13<00:36, 13.82it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.78it/s] 26%|██▋       | 181/684 [00:13<00:36, 13.80it/s] 27%|██▋       | 183/684 [00:13<00:36, 13.74it/s] 27%|██▋       | 185/684 [00:13<00:36, 13.76it/s] 27%|██▋       | 187/684 [00:13<00:36, 13.73it/s] 28%|██▊       | 189/684 [00:13<00:35, 13.75it/s] 28%|██▊       | 191/684 [00:14<00:35, 13.76it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.75it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.76it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.77it/s] 29%|██▉       | 199/684 [00:14<00:35, 13.77it/s] 29%|██▉       | 201/684 [00:14<00:35, 13.78it/s] 30%|██▉       | 203/684 [00:14<00:34, 13.79it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.71it/s] 30%|███       | 207/684 [00:15<00:34, 13.73it/s] 31%|███       | 209/684 [00:15<00:34, 13.76it/s] 31%|███       | 211/684 [00:15<00:34, 13.69it/s] 31%|███       | 213/684 [00:15<00:34, 13.74it/s] 31%|███▏      | 215/684 [00:15<00:34, 13.71it/s] 32%|███▏      | 217/684 [00:15<00:34, 13.71it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.76it/s] 32%|███▏      | 221/684 [00:16<00:34, 13.57it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.77it/s] 33%|███▎      | 225/684 [00:16<00:33, 13.76it/s] 33%|███▎      | 227/684 [00:16<00:33, 13.77it/s] 33%|███▎      | 229/684 [00:19<03:03,  2.49it/s] 34%|███▍      | 231/684 [00:19<02:16,  3.33it/s] 34%|███▍      | 233/684 [00:19<01:43,  4.35it/s] 34%|███▍      | 235/684 [00:19<01:21,  5.48it/s] 35%|███▍      | 237/684 [00:19<01:06,  6.70it/s] 35%|███▍      | 239/684 [00:19<00:56,  7.87it/s] 35%|███▌  
    | 241/684 [00:19<00:50,  8.78it/s] 36%|███▌      | 243/684 [00:20<00:45,  9.63it/s] 36%|███▌      | 245/684 [00:20<00:42, 10.44it/s] 36%|███▌      | 247/684 [00:20<00:39, 10.97it/s] 36%|███▋      | 249/684 [00:20<00:37, 11.64it/s] 37%|███▋      | 251/684 [00:20<00:36, 11.91it/s] 37%|███▋      | 253/684 [00:20<00:34, 12.47it/s] 37%|███▋      | 255/684 [00:20<00:34, 12.58it/s] 38%|███▊      | 257/684 [00:21<00:33, 12.89it/s] 38%|███▊      | 259/684 [00:21<00:33, 12.81it/s] 38%|███▊      | 261/684 [00:21<00:32, 13.00it/s] 38%|███▊      | 263/684 [00:21<00:32, 13.01it/s] 39%|███▊      | 265/684 [00:21<00:31, 13.31it/s] 39%|███▉      | 267/684 [00:21<00:31, 13.04it/s] 39%|███▉      | 269/684 [00:22<00:31, 13.21it/s] 40%|███▉      | 271/684 [00:22<00:31, 12.98it/s] 40%|███▉      | 273/684 [00:22<00:31, 13.21it/s] 40%|████      | 275/684 [00:22<00:31, 13.04it/s] 40%|████      | 277/684 [00:22<00:30, 13.37it/s] 41%|████      | 279/684 [00:22<00:30, 13.21it/s] 41%|████      | 281/684 [00:22<00:31, 12.98it/s] 41%|████▏     | 283/684 [00:23<00:30, 12.99it/s] 42%|████▏     | 285/684 [00:23<00:31, 12.86it/s] 42%|████▏     | 287/684 [00:23<00:30, 13.02it/s] 42%|████▏     | 289/684 [00:23<00:30, 12.90it/s] 43%|████▎     | 291/684 [00:23<00:30, 13.07it/s] 43%|████▎     | 293/684 [00:23<00:29, 13.10it/s] 43%|████▎     | 295/684 [00:23<00:29, 13.24it/s] 43%|████▎     | 297/684 [00:24<00:29, 13.28it/s] 44%|████▎     | 299/684 [00:24<00:29, 13.25it/s] 44%|████▍     | 301/684 [00:24<00:29, 13.05it/s] 44%|████▍     | 303/684 [00:24<00:28, 13.17it/s] 45%|████▍     | 305/684 [00:24<00:29, 13.00it/s] 45%|████▍     | 307/684 [00:24<00:28, 13.16it/s] 45%|████▌     | 309/684 [00:25<00:28, 13.15it/s] 45%|████▌     | 311/684 [00:25<00:28, 13.09it/s] 46%|████▌     | 313/684 [00:25<00:27, 13.46it/s] 46%|████▌     | 315/684 [00:25<00:28, 13.14it/s] 46%|████▋     | 317/684 [00:25<00:28, 13.03it/s] 47%|████▋     | 319/684 [00:25<00:27, 13.29it/s] 47%|████▋ 
    | 321/684 [00:25<00:27, 13.39it/s] 47%|████▋     | 323/684 [00:26<00:26, 13.64it/s] 48%|████▊     | 325/684 [00:26<00:26, 13.76it/s] 48%|████▊     | 327/684 [00:26<00:25, 13.84it/s] 48%|████▊     | 329/684 [00:26<00:25, 13.88it/s] 48%|████▊     | 331/684 [00:26<00:25, 13.94it/s] 49%|████▊     | 333/684 [00:26<00:25, 13.93it/s] 49%|████▉     | 335/684 [00:26<00:25, 13.92it/s] 49%|████▉     | 337/684 [00:27<00:24, 13.92it/s] 50%|████▉     | 339/684 [00:27<00:24, 13.90it/s] 50%|████▉     | 341/684 [00:27<00:24, 13.89it/s] 50%|█████     | 343/684 [00:27<00:24, 13.89it/s] 50%|█████     | 345/684 [00:27<00:24, 13.92it/s] 51%|█████     | 347/684 [00:27<00:24, 13.92it/s] 51%|█████     | 349/684 [00:27<00:24, 13.90it/s] 51%|█████▏    | 351/684 [00:28<00:23, 13.92it/s] 52%|█████▏    | 353/684 [00:28<00:23, 13.90it/s] 52%|█████▏    | 355/684 [00:28<00:23, 13.93it/s] 52%|█████▏    | 357/684 [00:28<00:23, 13.93it/s] 52%|█████▏    | 359/684 [00:28<00:23, 13.89it/s] 53%|█████▎    | 361/684 [00:28<00:23, 13.93it/s] 53%|█████▎    | 363/684 [00:28<00:23, 13.96it/s] 53%|█████▎    | 365/684 [00:29<00:22, 14.00it/s] 54%|█████▎    | 367/684 [00:29<00:22, 13.97it/s] 54%|█████▍    | 369/684 [00:29<00:22, 13.96it/s] 54%|█████▍    | 371/684 [00:29<00:22, 13.98it/s] 55%|█████▍    | 373/684 [00:29<00:22, 13.96it/s] 55%|█████▍    | 375/684 [00:29<00:22, 13.94it/s] 55%|█████▌    | 377/684 [00:29<00:22, 13.94it/s] 55%|█████▌    | 379/684 [00:30<00:21, 13.93it/s] 56%|█████▌    | 381/684 [00:30<00:21, 13.97it/s] 56%|█████▌    | 383/684 [00:30<00:21, 13.95it/s] 56%|█████▋    | 385/684 [00:30<00:21, 13.93it/s] 57%|█████▋    | 387/684 [00:30<00:21, 13.94it/s] 57%|█████▋    | 389/684 [00:30<00:21, 13.92it/s] 57%|█████▋    | 391/684 [00:30<00:21, 13.91it/s] 57%|█████▋    | 393/684 [00:31<00:20, 13.94it/s] 58%|█████▊    | 395/684 [00:31<00:20, 13.94it/s] 58%|█████▊    | 397/684 [00:31<00:20, 13.95it/s] 58%|█████▊    | 399/684 [00:31<00:20, 13.97it/s] 
59%|█████▊    | 401/684 [00:31<00:20, 13.96it/s] 59%|█████▉    | 403/684 [00:31<00:20, 13.95it/s] 59%|█████▉    | 405/684 [00:31<00:20, 13.92it/s] 60%|█████▉    | 407/684 [00:32<00:19, 13.95it/s] 60%|█████▉    | 409/684 [00:32<00:19, 13.96it/s] 60%|██████    | 411/684 [00:32<00:19, 13.97it/s] 60%|██████    | 413/684 [00:32<00:19, 13.96it/s] 61%|██████    | 415/684 [00:32<00:19, 13.97it/s] 61%|██████    | 417/684 [00:32<00:19, 13.95it/s] 61%|██████▏   | 419/684 [00:32<00:18, 13.98it/s] 62%|██████▏   | 421/684 [00:33<00:18, 13.98it/s] 62%|██████▏   | 423/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 425/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 427/684 [00:33<00:18, 14.01it/s] 63%|██████▎   | 429/684 [00:33<00:18, 14.02it/s] 63%|██████▎   | 431/684 [00:33<00:18, 14.01it/s] 63%|██████▎   | 433/684 [00:33<00:17, 14.01it/s] 64%|██████▎   | 435/684 [00:34<00:17, 13.99it/s] 64%|██████▍   | 437/684 [00:34<00:17, 13.97it/s] 64%|██████▍   | 439/684 [00:34<00:17, 14.00it/s] 64%|██████▍   | 441/684 [00:34<00:17, 13.98it/s] 65%|██████▍   | 443/684 [00:34<00:17, 13.99it/s] 65%|██████▌   | 445/684 [00:34<00:17, 14.00it/s] 65%|██████▌   | 447/684 [00:34<00:16, 14.01it/s] 66%|██████▌   | 449/684 [00:35<00:16, 14.01it/s] 66%|██████▌   | 451/684 [00:35<00:16, 14.02it/s] 66%|██████▌   | 453/684 [00:35<00:16, 13.99it/s] 67%|██████▋   | 455/684 [00:35<00:16, 14.00it/s] 67%|██████▋   | 457/684 [00:38<01:45,  2.16it/s] 67%|██████▋   | 459/684 [00:38<01:17,  2.89it/s] 67%|██████▋   | 461/684 [00:38<00:58,  3.79it/s] 68%|██████▊   | 463/684 [00:38<00:45,  4.82it/s] 68%|██████▊   | 465/684 [00:38<00:37,  5.87it/s] 68%|██████▊   | 467/684 [00:39<00:31,  6.95it/s] 69%|██████▊   | 469/684 [00:39<00:27,  7.95it/s] 69%|██████▉   | 471/684 [00:39<00:24,  8.86it/s] 69%|██████▉   | 473/684 [00:39<00:21,  9.72it/s] 69%|██████▉   | 475/684 [00:39<00:20, 10.45it/s] 70%|██████▉   | 477/684 [00:39<00:18, 11.14it/s] 70%|███████   | 479/684 [00:40<00:17, 11.50it/s] 
70%|███████   | 481/684 [00:40<00:16, 12.13it/s] 71%|███████   | 483/684 [00:40<00:16, 12.41it/s] 71%|███████   | 485/684 [00:40<00:15, 12.78it/s] 71%|███████   | 487/684 [00:40<00:15, 12.57it/s] 71%|███████▏  | 489/684 [00:40<00:15, 12.50it/s] 72%|███████▏  | 491/684 [00:40<00:14, 12.98it/s] 72%|███████▏  | 493/684 [00:41<00:14, 12.79it/s] 72%|███████▏  | 495/684 [00:41<00:14, 13.26it/s] 73%|███████▎  | 497/684 [00:41<00:14, 12.91it/s] 73%|███████▎  | 499/684 [00:41<00:14, 13.12it/s]                                                  73%|███████▎  | 500/684 [00:41<00:14, 13.12it/s] 73%|███████▎  | 501/684 [00:41<00:14, 12.84it/s] 74%|███████▎  | 503/684 [00:41<00:14, 12.80it/s] 74%|███████▍  | 505/684 [00:42<00:13, 12.84it/s] 74%|███████▍  | 507/684 [00:42<00:14, 12.49it/s] 74%|███████▍  | 509/684 [00:42<00:13, 12.92it/s] 75%|███████▍  | 511/684 [00:42<00:13, 12.59it/s] 75%|███████▌  | 513/684 [00:42<00:13, 12.52it/s] 75%|███████▌  | 515/684 [00:42<00:13, 12.82it/s] 76%|███████▌  | 517/684 [00:42<00:13, 12.62it/s] 76%|███████▌  | 519/684 [00:43<00:13, 12.46it/s] 76%|███████▌  | 521/684 [00:43<00:13, 12.47it/s] 76%|███████▋  | 523/684 [00:43<00:12, 12.43it/s] 77%|███████▋  | 525/684 [00:43<00:12, 12.42it/s] 77%|███████▋  | 527/684 [00:43<00:12, 12.23it/s] 77%|███████▋  | 529/684 [00:43<00:12, 12.67it/s] 78%|███████▊  | 531/684 [00:44<00:12, 12.63it/s] 78%|███████▊  | 533/684 [00:44<00:11, 13.03it/s] 78%|███████▊  | 535/684 [00:44<00:11, 13.21it/s] 79%|███████▊  | 537/684 [00:44<00:11, 13.19it/s] 79%|███████▉  | 539/684 [00:44<00:10, 13.54it/s] 79%|███████▉  | 541/684 [00:44<00:10, 13.65it/s] 79%|███████▉  | 543/684 [00:44<00:10, 13.71it/s] 80%|███████▉  | 545/684 [00:45<00:10, 13.73it/s] 80%|███████▉  | 547/684 [00:45<00:09, 13.74it/s] 80%|████████  | 549/684 [00:45<00:09, 13.76it/s] 81%|████████  | 551/684 [00:45<00:09, 13.79it/s] 81%|████████  | 553/684 [00:45<00:09, 13.78it/s] 81%|████████  | 555/684 [00:45<00:09, 13.78it/s]
 81%|████████▏ | 557/684 [00:46<00:09, 13.79it/s] 82%|████████▏ | 559/684 [00:46<00:09, 13.82it/s] 82%|████████▏ | 561/684 [00:46<00:08, 13.77it/s] 82%|████████▏ | 563/684 [00:46<00:08, 13.84it/s] 83%|████████▎ | 565/684 [00:46<00:08, 13.79it/s] 83%|████████▎ | 567/684 [00:46<00:08, 13.80it/s] 83%|████████▎ | 569/684 [00:46<00:08, 13.82it/s] 83%|████████▎ | 571/684 [00:47<00:08, 13.76it/s] 84%|████████▍ | 573/684 [00:47<00:08, 13.70it/s] 84%|████████▍ | 575/684 [00:47<00:07, 13.65it/s] 84%|████████▍ | 577/684 [00:47<00:07, 13.65it/s] 85%|████████▍ | 579/684 [00:47<00:07, 13.62it/s] 85%|████████▍ | 581/684 [00:47<00:07, 13.52it/s] 85%|████████▌ | 583/684 [00:47<00:07, 13.44it/s] 86%|████████▌ | 585/684 [00:48<00:07, 13.53it/s] 86%|████████▌ | 587/684 [00:48<00:07, 13.52it/s] 86%|████████▌ | 589/684 [00:48<00:07, 13.50it/s] 86%|████████▋ | 591/684 [00:48<00:06, 13.44it/s] 87%|████████▋ | 593/684 [00:48<00:06, 13.53it/s] 87%|████████▋ | 595/684 [00:48<00:06, 13.67it/s] 87%|████████▋ | 597/684 [00:48<00:06, 13.64it/s] 88%|████████▊ | 599/684 [00:49<00:06, 13.68it/s] 88%|████████▊ | 601/684 [00:49<00:06, 13.68it/s] 88%|████████▊ | 603/684 [00:49<00:05, 13.73it/s] 88%|████████▊ | 605/684 [00:49<00:05, 13.71it/s] 89%|████████▊ | 607/684 [00:49<00:05, 13.74it/s] 89%|████████▉ | 609/684 [00:49<00:05, 13.79it/s] 89%|████████▉ | 611/684 [00:49<00:05, 13.74it/s] 90%|████████▉ | 613/684 [00:50<00:05, 13.73it/s] 90%|████████▉ | 615/684 [00:50<00:05, 13.74it/s] 90%|█████████ | 617/684 [00:50<00:04, 13.87it/s] 90%|█████████ | 619/684 [00:50<00:04, 13.93it/s] 91%|█████████ | 621/684 [00:50<00:04, 13.84it/s] 91%|█████████ | 623/684 [00:50<00:04, 13.82it/s] 91%|█████████▏| 625/684 [00:50<00:04, 13.86it/s] 92%|█████████▏| 627/684 [00:51<00:04, 13.80it/s] 92%|█████████▏| 629/684 [00:51<00:03, 13.84it/s] 92%|█████████▏| 631/684 [00:51<00:03, 13.79it/s] 93%|█████████▎| 633/684 [00:51<00:03, 13.77it/s] 93%|█████████▎| 635/684 [00:51<00:03, 13.75it/s]
 93%|█████████▎| 637/684 [00:51<00:03, 13.74it/s] 93%|█████████▎| 639/684 [00:51<00:03, 13.77it/s] 94%|█████████▎| 641/684 [00:52<00:03, 13.73it/s] 94%|█████████▍| 643/684 [00:52<00:02, 13.68it/s] 94%|█████████▍| 645/684 [00:52<00:02, 13.70it/s] 95%|█████████▍| 647/684 [00:52<00:02, 13.74it/s] 95%|█████████▍| 649/684 [00:52<00:02, 13.74it/s] 95%|█████████▌| 651/684 [00:52<00:02, 13.76it/s] 95%|█████████▌| 653/684 [00:53<00:02, 13.74it/s] 96%|█████████▌| 655/684 [00:53<00:02, 13.73it/s] 96%|█████████▌| 657/684 [00:53<00:01, 13.71it/s] 96%|█████████▋| 659/684 [00:53<00:01, 13.75it/s] 97%|█████████▋| 661/684 [00:53<00:01, 13.71it/s] 97%|█████████▋| 663/684 [00:53<00:01, 13.71it/s] 97%|█████████▋| 665/684 [00:53<00:01, 13.72it/s] 98%|█████████▊| 667/684 [00:54<00:01, 13.74it/s] 98%|█████████▊| 669/684 [00:54<00:01, 13.85it/s] 98%|█████████▊| 671/684 [00:54<00:00, 13.80it/s] 98%|█████████▊| 673/684 [00:54<00:00, 13.78it/s] 99%|█████████▊| 675/684 [00:54<00:00, 13.76it/s] 99%|█████████▉| 677/684 [00:54<00:00, 13.79it/s] 99%|█████████▉| 679/684 [00:54<00:00, 13.78it/s]100%|█████████▉| 681/684 [00:55<00:00, 13.77it/s]100%|█████████▉| 683/684 [00:55<00:00, 13.80it/s]                                                 100%|██████████| 684/684 [00:57<00:00, 13.80it/s]100%|██████████| 684/684 [00:57<00:00, 11.86it/s]
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.18s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.09s/it] 25%|██▌       | 4/16 [00:13<00:42,  3.55s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.83s/it] 38%|███▊      | 6/16 [00:21<00:40,  4.01s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.12s/it] 50%|█████     | 8/16 [00:30<00:33,  4.19s/it] 56%|█████▋    | 9/16 [00:34<00:29,  4.24s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.28s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.30s/it] 75%|███████▌  | 12/16 [00:47<00:17,  4.32s/it] 81%|████████▏ | 13/16 [00:52<00:12,  4.33s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.34s/it] 94%|█████████▍| 15/16 [01:00<00:04,  4.35s/it]100%|██████████| 16/16 [01:04<00:00,  3.97s/it]100%|██████████| 16/16 [01:04<00:00,  4.02s/it]
-/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning
-  warnings.warn(
-/mnt/storage/aatherton/hf_eng_fra_trans is already a clone of https://huggingface.co/aatherton2024/hf_eng_fra_trans. Make sure you pull the latest changes with `repo.git_pull()`.
-  0%|          | 0/2736 [00:00<?, ?it/s]  0%|          | 1/2736 [00:00<05:01,  9.08it/s]  0%|          | 3/2736 [00:00<04:14, 10.73it/s]  0%|          | 5/2736 [00:00<03:59, 11.40it/s]  0%|          | 7/2736 [00:00<03:56, 11.55it/s]  0%|          | 9/2736 [00:00<03:53, 11.66it/s]  0%|          | 11/2736 [00:00<03:53, 11.68it/s]  0%|          | 13/2736 [00:01<03:51, 11.76it/s]  1%|          | 15/2736 [00:01<03:51, 11.74it/s]  1%|          | 17/2736 [00:01<03:49, 11.84it/s]  1%|          | 19/2736 [00:01<03:49, 11.84it/s]  1%|          | 21/2736 [00:01<03:49, 11.84it/s]  1%|          | 23/2736 [00:01<03:50, 11.80it/s]  1%|          | 25/2736 [00:02<03:48, 11.85it/s]  1%|          | 27/2736 [00:02<03:46, 11.94it/s]  1%|          | 29/2736 [00:02<03:43, 12.11it/s]  1%|          | 31/2736 [00:02<03:41, 12.22it/s]  1%|          | 33/2736 [00:02<03:39, 12.32it/s]  1%|▏         | 35/2736 [00:02<03:37, 12.40it/s]  1%|▏         | 37/2736 [00:03<03:38, 12.38it/s]  1%|▏         | 39/2736 [00:03<03:36, 12.48it/s]  1%|▏         | 41/2736 [00:03<03:37, 12.40it/s]  2%|▏         | 43/2736 [00:03<03:35, 12.47it/s]  2%|▏         | 45/2736 [00:03<03:34, 12.52it/s]  2%|▏         | 47/2736 [00:03<03:34, 12.55it/s]  2%|▏         | 49/2736 [00:04<03:36, 12.42it/s]  2%|▏         | 51/2736 [00:04<03:35, 12.44it/s]  2%|▏         | 53/2736 [00:04<03:36, 12.40it/s]  2%|▏         | 55/2736 [00:04<03:35, 12.46it/s]  2%|▏         | 57/2736 [00:04<03:35, 12.44it/s]  2%|▏         | 59/2736 [00:04<03:34, 12.51it/s]  2%|▏         | 61/2736 [00:05<03:33, 12.53it/s]  2%|▏         | 63/2736 [00:05<03:34, 12.44it/s]  2%|▏         | 65/2736 [00:05<03:33, 12.49it/s]  2%|▏         | 67/2736 [00:05<03:35, 12.40it/s]  3%|▎         | 69/2736 [00:05<03:33, 12.48it/s]  3%|▎         | 71/2736 [00:05<03:32, 12.57it/s]  3%|▎         | 73/2736 [00:05<03:31, 12.59it/s]  3%|▎         | 75/2736 [00:06<03:30, 12.64it/s]  3%|▎         | 77/2736 [00:06<03:31, 12.59it/s]  3%|▎      
   | 79/2736 [00:06<03:30, 12.63it/s]  3%|▎         | 81/2736 [00:06<03:31, 12.57it/s]  3%|▎         | 83/2736 [00:06<03:31, 12.53it/s]  3%|▎         | 85/2736 [00:06<03:32, 12.45it/s]  3%|▎         | 87/2736 [00:07<03:31, 12.50it/s]  3%|▎         | 89/2736 [00:07<03:32, 12.45it/s]  3%|▎         | 91/2736 [00:07<03:32, 12.43it/s]  3%|▎         | 93/2736 [00:07<03:34, 12.35it/s]  3%|▎         | 95/2736 [00:07<03:34, 12.30it/s]  4%|▎         | 97/2736 [00:07<03:33, 12.38it/s]  4%|▎         | 99/2736 [00:08<03:34, 12.31it/s]  4%|▎         | 101/2736 [00:08<03:34, 12.28it/s]  4%|▍         | 103/2736 [00:08<03:33, 12.36it/s]  4%|▍         | 105/2736 [00:08<03:31, 12.46it/s]  4%|▍         | 107/2736 [00:08<03:29, 12.53it/s]  4%|▍         | 109/2736 [00:08<03:30, 12.50it/s]  4%|▍         | 111/2736 [00:09<03:29, 12.53it/s]  4%|▍         | 113/2736 [00:09<03:28, 12.57it/s]  4%|▍         | 115/2736 [00:09<03:29, 12.54it/s]  4%|▍         | 117/2736 [00:09<03:27, 12.62it/s]  4%|▍         | 119/2736 [00:09<03:27, 12.64it/s]  4%|▍         | 121/2736 [00:09<03:26, 12.64it/s]  4%|▍         | 123/2736 [00:09<03:26, 12.65it/s]  5%|▍         | 125/2736 [00:10<03:26, 12.64it/s]  5%|▍         | 127/2736 [00:10<03:27, 12.56it/s]  5%|▍         | 129/2736 [00:10<03:27, 12.57it/s]  5%|▍         | 131/2736 [00:10<03:28, 12.51it/s]  5%|▍         | 133/2736 [00:10<03:27, 12.52it/s]  5%|▍         | 135/2736 [00:10<03:29, 12.43it/s]  5%|▌         | 137/2736 [00:11<03:28, 12.48it/s]  5%|▌         | 139/2736 [00:11<03:29, 12.41it/s]  5%|▌         | 141/2736 [00:11<03:27, 12.52it/s]  5%|▌         | 143/2736 [00:11<03:27, 12.52it/s]  5%|▌         | 145/2736 [00:11<03:27, 12.47it/s]  5%|▌         | 147/2736 [00:11<03:26, 12.51it/s]  5%|▌         | 149/2736 [00:12<03:26, 12.53it/s]  6%|▌         | 151/2736 [00:12<03:27, 12.49it/s]  6%|▌         | 153/2736 [00:12<03:25, 12.54it/s]  6%|▌         | 155/2736 [00:12<03:25, 12.56it/s]  6%|▌         | 157/2736 
[00:12<03:26, 12.49it/s]  6%|▌         | 159/2736 [00:12<03:25, 12.57it/s]  6%|▌         | 161/2736 [00:13<03:24, 12.58it/s]  6%|▌         | 163/2736 [00:13<03:25, 12.50it/s]  6%|▌         | 165/2736 [00:13<03:25, 12.49it/s]  6%|▌         | 167/2736 [00:13<03:25, 12.52it/s]  6%|▌         | 169/2736 [00:13<03:24, 12.54it/s]  6%|▋         | 171/2736 [00:13<03:24, 12.55it/s]  6%|▋         | 173/2736 [00:13<03:25, 12.47it/s]  6%|▋         | 175/2736 [00:14<03:24, 12.51it/s]  6%|▋         | 177/2736 [00:14<03:25, 12.43it/s]  7%|▋         | 179/2736 [00:14<03:24, 12.48it/s]  7%|▋         | 181/2736 [00:14<03:25, 12.41it/s]  7%|▋         | 183/2736 [00:14<03:24, 12.49it/s]  7%|▋         | 185/2736 [00:14<03:26, 12.35it/s]  7%|▋         | 187/2736 [00:15<03:26, 12.33it/s]  7%|▋         | 189/2736 [00:15<03:25, 12.41it/s]  7%|▋         | 191/2736 [00:15<03:24, 12.42it/s]  7%|▋         | 193/2736 [00:15<03:24, 12.46it/s]  7%|▋         | 195/2736 [00:15<03:23, 12.50it/s]  7%|▋         | 197/2736 [00:15<03:24, 12.42it/s]  7%|▋         | 199/2736 [00:16<03:23, 12.48it/s]  7%|▋         | 201/2736 [00:16<03:23, 12.47it/s]  7%|▋         | 203/2736 [00:16<03:22, 12.50it/s]  7%|▋         | 205/2736 [00:16<03:21, 12.59it/s]  8%|▊         | 207/2736 [00:16<03:22, 12.48it/s]  8%|▊         | 209/2736 [00:16<03:21, 12.54it/s]  8%|▊         | 211/2736 [00:17<03:21, 12.53it/s]  8%|▊         | 213/2736 [00:17<03:21, 12.51it/s]  8%|▊         | 215/2736 [00:17<03:22, 12.45it/s]  8%|▊         | 217/2736 [00:17<03:21, 12.50it/s]  8%|▊         | 219/2736 [00:17<03:20, 12.55it/s]  8%|▊         | 221/2736 [00:17<03:19, 12.60it/s]  8%|▊         | 223/2736 [00:17<03:21, 12.50it/s]  8%|▊         | 225/2736 [00:18<03:19, 12.58it/s]  8%|▊         | 227/2736 [00:18<03:19, 12.57it/s]  8%|▊         | 229/2736 [00:18<03:21, 12.47it/s]  8%|▊         | 231/2736 [00:18<03:19, 12.54it/s]  9%|▊         | 233/2736 [00:18<03:19, 12.56it/s]  9%|▊         | 235/2736 
[00:18<03:19, 12.51it/s]  9%|▊         | 237/2736 [00:19<03:19, 12.52it/s]  9%|▊         | 239/2736 [00:19<03:18, 12.57it/s]  9%|▉         | 241/2736 [00:19<03:20, 12.47it/s]  9%|▉         | 243/2736 [00:19<03:19, 12.52it/s]  9%|▉         | 245/2736 [00:19<03:20, 12.45it/s]  9%|▉         | 247/2736 [00:19<03:18, 12.55it/s]  9%|▉         | 249/2736 [00:20<03:18, 12.55it/s]  9%|▉         | 251/2736 [00:20<03:18, 12.54it/s]  9%|▉         | 253/2736 [00:20<03:17, 12.56it/s]  9%|▉         | 255/2736 [00:20<03:17, 12.56it/s]  9%|▉         | 257/2736 [00:20<03:17, 12.58it/s]  9%|▉         | 259/2736 [00:20<03:17, 12.54it/s] 10%|▉         | 261/2736 [00:21<03:17, 12.52it/s] 10%|▉         | 263/2736 [00:21<03:17, 12.55it/s] 10%|▉         | 265/2736 [00:21<03:18, 12.44it/s] 10%|▉         | 267/2736 [00:21<03:17, 12.51it/s] 10%|▉         | 269/2736 [00:21<03:18, 12.41it/s] 10%|▉         | 271/2736 [00:21<03:17, 12.48it/s] 10%|▉         | 273/2736 [00:21<03:17, 12.48it/s] 10%|█         | 275/2736 [00:22<03:17, 12.43it/s] 10%|█         | 277/2736 [00:22<03:16, 12.51it/s] 10%|█         | 279/2736 [00:22<03:16, 12.50it/s] 10%|█         | 281/2736 [00:22<03:17, 12.44it/s] 10%|█         | 283/2736 [00:22<03:16, 12.48it/s] 10%|█         | 285/2736 [00:22<03:17, 12.43it/s] 10%|█         | 287/2736 [00:23<03:15, 12.50it/s] 11%|█         | 289/2736 [00:23<03:16, 12.43it/s] 11%|█         | 291/2736 [00:23<03:15, 12.53it/s] 11%|█         | 293/2736 [00:23<03:17, 12.38it/s] 11%|█         | 295/2736 [00:23<03:15, 12.47it/s] 11%|█         | 297/2736 [00:23<03:14, 12.51it/s] 11%|█         | 299/2736 [00:24<03:15, 12.50it/s] 11%|█         | 301/2736 [00:24<03:16, 12.39it/s] 11%|█         | 303/2736 [00:24<03:14, 12.50it/s] 11%|█         | 305/2736 [00:24<03:15, 12.45it/s] 11%|█         | 307/2736 [00:24<03:14, 12.47it/s] 11%|█▏        | 309/2736 [00:24<03:14, 12.50it/s] 11%|█▏        | 311/2736 [00:25<03:14, 12.47it/s] 11%|█▏        | 313/2736 
[00:25<03:13, 12.50it/s] 12%|█▏        | 315/2736 [00:25<03:13, 12.49it/s] 12%|█▏        | 317/2736 [00:25<03:13, 12.49it/s] 12%|█▏        | 319/2736 [00:25<03:12, 12.55it/s] 12%|█▏        | 321/2736 [00:25<03:13, 12.45it/s] 12%|█▏        | 323/2736 [00:25<03:13, 12.48it/s] 12%|█▏        | 325/2736 [00:26<03:14, 12.38it/s] 12%|█▏        | 327/2736 [00:26<03:15, 12.33it/s] 12%|█▏        | 329/2736 [00:26<03:13, 12.44it/s] 12%|█▏        | 331/2736 [00:26<03:12, 12.49it/s] 12%|█▏        | 333/2736 [00:26<03:12, 12.46it/s] 12%|█▏        | 335/2736 [00:26<03:12, 12.45it/s] 12%|█▏        | 337/2736 [00:27<03:12, 12.49it/s] 12%|█▏        | 339/2736 [00:27<03:10, 12.56it/s] 12%|█▏        | 341/2736 [00:27<03:10, 12.57it/s] 13%|█▎        | 343/2736 [00:27<03:11, 12.50it/s] 13%|█▎        | 345/2736 [00:27<03:10, 12.55it/s] 13%|█▎        | 347/2736 [00:27<03:10, 12.57it/s] 13%|█▎        | 349/2736 [00:28<03:10, 12.50it/s] 13%|█▎        | 351/2736 [00:28<03:10, 12.54it/s] 13%|█▎        | 353/2736 [00:28<03:11, 12.46it/s] 13%|█▎        | 355/2736 [00:28<03:10, 12.53it/s] 13%|█▎        | 357/2736 [00:28<03:10, 12.49it/s] 13%|█▎        | 359/2736 [00:28<03:09, 12.57it/s] 13%|█▎        | 361/2736 [00:29<03:09, 12.53it/s] 13%|█▎        | 363/2736 [00:29<03:08, 12.57it/s] 13%|█▎        | 365/2736 [00:29<03:08, 12.57it/s] 13%|█▎        | 367/2736 [00:29<03:09, 12.49it/s] 13%|█▎        | 369/2736 [00:29<03:09, 12.52it/s] 14%|█▎        | 371/2736 [00:29<03:09, 12.49it/s] 14%|█▎        | 373/2736 [00:29<03:08, 12.51it/s] 14%|█▎        | 375/2736 [00:30<03:08, 12.55it/s] 14%|█▍        | 377/2736 [00:30<03:08, 12.50it/s] 14%|█▍        | 379/2736 [00:30<03:08, 12.47it/s] 14%|█▍        | 381/2736 [00:30<03:08, 12.51it/s] 14%|█▍        | 383/2736 [00:30<03:07, 12.58it/s] 14%|█▍        | 385/2736 [00:30<03:06, 12.58it/s] 14%|█▍        | 387/2736 [00:31<03:07, 12.51it/s] 14%|█▍        | 389/2736 [00:31<03:07, 12.55it/s] 14%|█▍        | 391/2736 
[00:31<03:07, 12.53it/s] 14%|█▍        | 393/2736 [00:31<03:06, 12.54it/s] 14%|█▍        | 395/2736 [00:31<03:05, 12.60it/s] 15%|█▍        | 397/2736 [00:31<03:05, 12.60it/s] 15%|█▍        | 399/2736 [00:32<03:06, 12.56it/s] 15%|█▍        | 401/2736 [00:32<03:05, 12.57it/s] 15%|█▍        | 403/2736 [00:32<03:06, 12.53it/s] 15%|█▍        | 405/2736 [00:32<03:05, 12.54it/s] 15%|█▍        | 407/2736 [00:32<03:05, 12.57it/s] 15%|█▍        | 409/2736 [00:32<03:06, 12.50it/s] 15%|█▌        | 411/2736 [00:33<03:05, 12.55it/s] 15%|█▌        | 413/2736 [00:33<03:04, 12.60it/s] 15%|█▌        | 415/2736 [00:33<03:06, 12.45it/s] 15%|█▌        | 417/2736 [00:33<03:06, 12.40it/s] 15%|█▌        | 419/2736 [00:33<03:05, 12.46it/s] 15%|█▌        | 421/2736 [00:33<03:05, 12.50it/s] 15%|█▌        | 423/2736 [00:33<03:06, 12.41it/s] 16%|█▌        | 425/2736 [00:34<03:05, 12.46it/s] 16%|█▌        | 427/2736 [00:34<03:05, 12.41it/s] 16%|█▌        | 429/2736 [00:34<03:04, 12.48it/s] 16%|█▌        | 431/2736 [00:34<03:05, 12.40it/s] 16%|█▌        | 433/2736 [00:34<03:04, 12.49it/s] 16%|█▌        | 435/2736 [00:34<03:04, 12.47it/s] 16%|█▌        | 437/2736 [00:35<03:03, 12.51it/s] 16%|█▌        | 439/2736 [00:35<03:03, 12.53it/s] 16%|█▌        | 441/2736 [00:35<03:02, 12.54it/s] 16%|█▌        | 443/2736 [00:35<03:03, 12.48it/s] 16%|█▋        | 445/2736 [00:35<03:02, 12.55it/s] 16%|█▋        | 447/2736 [00:35<03:02, 12.54it/s] 16%|█▋        | 449/2736 [00:36<03:02, 12.50it/s] 16%|█▋        | 451/2736 [00:36<03:01, 12.56it/s] 17%|█▋        | 453/2736 [00:36<03:03, 12.46it/s] 17%|█▋        | 455/2736 [00:36<03:02, 12.51it/s] 17%|█▋        | 457/2736 [00:36<03:01, 12.53it/s] 17%|█▋        | 459/2736 [00:36<03:02, 12.48it/s] 17%|█▋        | 461/2736 [00:37<03:01, 12.52it/s] 17%|█▋        | 463/2736 [00:37<03:00, 12.57it/s] 17%|█▋        | 465/2736 [00:37<03:02, 12.48it/s] 17%|█▋        | 467/2736 [00:37<03:00, 12.56it/s] 17%|█▋        | 469/2736 
[00:37<03:00, 12.55it/s] 17%|█▋        | 471/2736 [00:37<02:59, 12.62it/s] 17%|█▋        | 473/2736 [00:37<02:58, 12.65it/s] 17%|█▋        | 475/2736 [00:38<02:58, 12.69it/s] 17%|█▋        | 477/2736 [00:38<02:58, 12.64it/s] 18%|█▊        | 479/2736 [00:38<02:59, 12.56it/s] 18%|█▊        | 481/2736 [00:38<02:59, 12.55it/s] 18%|█▊        | 483/2736 [00:38<02:59, 12.55it/s] 18%|█▊        | 485/2736 [00:38<02:59, 12.57it/s] 18%|█▊        | 487/2736 [00:39<02:58, 12.60it/s] 18%|█▊        | 489/2736 [00:39<02:57, 12.63it/s] 18%|█▊        | 491/2736 [00:39<02:58, 12.56it/s] 18%|█▊        | 493/2736 [00:39<02:58, 12.55it/s] 18%|█▊        | 495/2736 [00:39<02:57, 12.60it/s] 18%|█▊        | 497/2736 [00:39<02:59, 12.48it/s] 18%|█▊        | 499/2736 [00:40<02:58, 12.56it/s] 18%|█▊        | 501/2736 [00:40<02:59, 12.44it/s] 18%|█▊        | 503/2736 [00:40<02:59, 12.44it/s] 18%|█▊        | 505/2736 [00:40<02:58, 12.48it/s] 19%|█▊        | 507/2736 [00:40<02:57, 12.53it/s] 19%|█▊        | 509/2736 [00:40<02:59, 12.38it/s] 19%|█▊        | 511/2736 [00:41<02:58, 12.44it/s] 19%|█▉        | 513/2736 [00:41<02:59, 12.42it/s] 19%|█▉        | 515/2736 [00:41<02:58, 12.44it/s] 19%|█▉        | 517/2736 [00:41<02:58, 12.41it/s] 19%|█▉        | 519/2736 [00:41<02:58, 12.40it/s] 19%|█▉        | 521/2736 [00:41<02:58, 12.44it/s] 19%|█▉        | 523/2736 [00:41<02:56, 12.52it/s] 19%|█▉        | 525/2736 [00:42<02:56, 12.54it/s] 19%|█▉        | 527/2736 [00:42<02:57, 12.46it/s] 19%|█▉        | 529/2736 [00:42<02:56, 12.54it/s] 19%|█▉        | 531/2736 [00:42<02:57, 12.45it/s] 19%|█▉        | 533/2736 [00:42<02:55, 12.52it/s] 20%|█▉        | 535/2736 [00:42<02:55, 12.55it/s] 20%|█▉        | 537/2736 [00:43<02:56, 12.48it/s] 20%|█▉        | 539/2736 [00:43<02:55, 12.53it/s] 20%|█▉        | 541/2736 [00:43<02:56, 12.46it/s] 20%|█▉        | 543/2736 [00:43<02:55, 12.52it/s] 20%|█▉        | 545/2736 [00:43<02:55, 12.46it/s] 20%|█▉        | 547/2736 
[00:43<02:54, 12.54it/s] 20%|██        | 549/2736 [00:44<02:54, 12.53it/s] 20%|██        | 551/2736 [00:44<02:55, 12.48it/s] 20%|██        | 553/2736 [00:44<02:54, 12.48it/s] 20%|██        | 555/2736 [00:44<02:55, 12.42it/s] 20%|██        | 557/2736 [00:44<02:54, 12.51it/s] 20%|██        | 559/2736 [00:44<02:55, 12.44it/s] 21%|██        | 561/2736 [00:45<02:54, 12.49it/s] 21%|██        | 563/2736 [00:45<02:54, 12.42it/s] 21%|██        | 565/2736 [00:45<02:53, 12.50it/s] 21%|██        | 567/2736 [00:45<02:52, 12.57it/s] 21%|██        | 569/2736 [00:45<02:53, 12.52it/s] 21%|██        | 571/2736 [00:45<02:52, 12.53it/s] 21%|██        | 573/2736 [00:45<02:52, 12.52it/s] 21%|██        | 575/2736 [00:46<02:51, 12.62it/s] 21%|██        | 577/2736 [00:46<02:52, 12.52it/s] 21%|██        | 579/2736 [00:46<02:51, 12.56it/s] 21%|██        | 581/2736 [00:46<02:52, 12.46it/s] 21%|██▏       | 583/2736 [00:46<02:53, 12.44it/s] 21%|██▏       | 585/2736 [00:46<02:51, 12.51it/s] 21%|██▏       | 587/2736 [00:47<02:51, 12.52it/s] 22%|██▏       | 589/2736 [00:47<02:50, 12.59it/s] 22%|██▏       | 591/2736 [00:47<02:51, 12.49it/s] 22%|██▏       | 593/2736 [00:47<02:51, 12.53it/s] 22%|██▏       | 595/2736 [00:47<02:51, 12.46it/s] 22%|██▏       | 597/2736 [00:47<02:50, 12.52it/s] 22%|██▏       | 599/2736 [00:48<02:50, 12.52it/s] 22%|██▏       | 601/2736 [00:48<02:51, 12.46it/s] 22%|██▏       | 603/2736 [00:48<02:50, 12.51it/s] 22%|██▏       | 605/2736 [00:48<02:51, 12.46it/s] 22%|██▏       | 607/2736 [00:48<02:50, 12.52it/s] 22%|██▏       | 609/2736 [00:48<02:50, 12.48it/s] 22%|██▏       | 611/2736 [00:49<02:50, 12.49it/s] 22%|██▏       | 613/2736 [00:49<02:50, 12.42it/s] 22%|██▏       | 615/2736 [00:49<02:50, 12.47it/s] 23%|██▎       | 617/2736 [00:49<02:49, 12.52it/s] 23%|██▎       | 619/2736 [00:49<02:49, 12.47it/s] 23%|██▎       | 621/2736 [00:49<02:48, 12.53it/s] 23%|██▎       | 623/2736 [00:49<02:50, 12.43it/s] 23%|██▎       | 625/2736 
[00:50<02:48, 12.51it/s] 23%|██▎       | 627/2736 [00:50<02:48, 12.53it/s] 23%|██▎       | 629/2736 [00:50<02:48, 12.47it/s] 23%|██▎       | 631/2736 [00:50<02:48, 12.51it/s] 23%|██▎       | 633/2736 [00:50<02:48, 12.47it/s] 23%|██▎       | 635/2736 [00:50<02:48, 12.45it/s] 23%|██▎       | 637/2736 [00:51<02:48, 12.47it/s] 23%|██▎       | 639/2736 [00:51<02:49, 12.40it/s] 23%|██▎       | 641/2736 [00:51<02:47, 12.49it/s] 24%|██▎       | 643/2736 [00:51<02:48, 12.44it/s] 24%|██▎       | 645/2736 [00:51<02:47, 12.49it/s] 24%|██▎       | 647/2736 [00:51<02:46, 12.54it/s] 24%|██▎       | 649/2736 [00:52<02:46, 12.50it/s] 24%|██▍       | 651/2736 [00:52<02:46, 12.56it/s] 24%|██▍       | 653/2736 [00:52<02:46, 12.54it/s] 24%|██▍       | 655/2736 [00:52<02:46, 12.49it/s] 24%|██▍       | 657/2736 [00:52<02:45, 12.54it/s] 24%|██▍       | 659/2736 [00:52<02:46, 12.45it/s] 24%|██▍       | 661/2736 [00:53<02:46, 12.50it/s] 24%|██▍       | 663/2736 [00:53<02:45, 12.53it/s] 24%|██▍       | 665/2736 [00:53<02:46, 12.46it/s] 24%|██▍       | 667/2736 [00:53<02:45, 12.53it/s] 24%|██▍       | 669/2736 [00:53<02:46, 12.44it/s] 25%|██▍       | 671/2736 [00:53<02:45, 12.50it/s] 25%|██▍       | 673/2736 [00:53<02:44, 12.55it/s] 25%|██▍       | 675/2736 [00:54<02:45, 12.47it/s] 25%|██▍       | 677/2736 [00:54<02:44, 12.51it/s] 25%|██▍       | 679/2736 [00:54<02:45, 12.45it/s] 25%|██▍       | 681/2736 [00:54<02:44, 12.53it/s] 25%|██▍       | 683/2736 [00:54<02:44, 12.45it/s] 25%|██▌       | 685/2736 [00:54<02:44, 12.51it/s] 25%|██▌       | 687/2736 [00:55<02:43, 12.50it/s] 25%|██▌       | 689/2736 [00:55<02:43, 12.50it/s] 25%|██▌       | 691/2736 [00:55<02:43, 12.53it/s] 25%|██▌       | 693/2736 [00:55<02:44, 12.46it/s] 25%|██▌       | 695/2736 [00:55<02:43, 12.51it/s] 25%|██▌       | 697/2736 [00:55<02:44, 12.43it/s] 26%|██▌       | 699/2736 [00:56<02:42, 12.52it/s] 26%|██▌       | 701/2736 [00:56<02:43, 12.44it/s] 26%|██▌       | 703/2736 
[00:56<02:42, 12.54it/s] 26%|██▌       | 705/2736 [00:56<02:42, 12.50it/s] 26%|██▌       | 707/2736 [00:56<02:41, 12.53it/s] 26%|██▌       | 709/2736 [00:56<02:41, 12.58it/s] 26%|██▌       | 711/2736 [00:57<02:41, 12.55it/s] 26%|██▌       | 713/2736 [00:57<02:42, 12.49it/s] 26%|██▌       | 715/2736 [00:57<02:41, 12.52it/s] 26%|██▌       | 717/2736 [00:57<02:41, 12.47it/s] 26%|██▋       | 719/2736 [00:57<02:40, 12.55it/s] 26%|██▋       | 721/2736 [00:57<02:41, 12.47it/s] 26%|██▋       | 723/2736 [00:57<02:40, 12.53it/s] 26%|██▋       | 725/2736 [00:58<02:41, 12.46it/s] 27%|██▋       | 727/2736 [00:58<02:40, 12.52it/s] 27%|██▋       | 729/2736 [00:58<02:40, 12.49it/s] 27%|██▋       | 731/2736 [00:58<02:40, 12.52it/s] 27%|██▋       | 733/2736 [00:58<02:39, 12.58it/s] 27%|██▋       | 735/2736 [00:58<02:40, 12.49it/s] 27%|██▋       | 737/2736 [00:59<02:39, 12.53it/s] 27%|██▋       | 739/2736 [00:59<02:39, 12.55it/s] 27%|██▋       | 741/2736 [00:59<02:39, 12.50it/s] 27%|██▋       | 743/2736 [00:59<02:38, 12.56it/s] 27%|██▋       | 745/2736 [00:59<02:39, 12.51it/s] 27%|██▋       | 747/2736 [00:59<02:38, 12.52it/s] 27%|██▋       | 749/2736 [01:00<02:37, 12.59it/s] 27%|██▋       | 751/2736 [01:00<02:38, 12.54it/s] 28%|██▊       | 753/2736 [01:00<02:37, 12.59it/s] 28%|██▊       | 755/2736 [01:00<02:36, 12.62it/s] 28%|██▊       | 757/2736 [01:00<02:38, 12.51it/s] 28%|██▊       | 759/2736 [01:00<02:37, 12.55it/s] 28%|██▊       | 761/2736 [01:01<02:37, 12.52it/s] 28%|██▊       | 763/2736 [01:01<02:37, 12.57it/s] 28%|██▊       | 765/2736 [01:01<02:36, 12.61it/s] 28%|██▊       | 767/2736 [01:01<02:35, 12.63it/s] 28%|██▊       | 769/2736 [01:01<02:37, 12.50it/s] 28%|██▊       | 771/2736 [01:01<02:36, 12.58it/s] 28%|██▊       | 773/2736 [01:01<02:37, 12.50it/s] 28%|██▊       | 775/2736 [01:02<02:36, 12.55it/s] 28%|██▊       | 777/2736 [01:02<02:37, 12.42it/s] 28%|██▊       | 779/2736 [01:02<02:36, 12.51it/s] 29%|██▊       | 781/2736 
[01:02<02:37, 12.44it/s] 29%|██▊       | 783/2736 [01:02<02:36, 12.51it/s] 29%|██▊       | 785/2736 [01:02<02:35, 12.56it/s] 29%|██▉       | 787/2736 [01:03<02:36, 12.49it/s] 29%|██▉       | 789/2736 [01:03<02:35, 12.50it/s] 29%|██▉       | 791/2736 [01:03<02:36, 12.43it/s] 29%|██▉       | 793/2736 [01:03<02:35, 12.51it/s] 29%|██▉       | 795/2736 [01:03<02:35, 12.44it/s] 29%|██▉       | 797/2736 [01:03<02:35, 12.49it/s] 29%|██▉       | 799/2736 [01:04<02:34, 12.56it/s] 29%|██▉       | 801/2736 [01:04<02:34, 12.49it/s] 29%|██▉       | 803/2736 [01:04<02:34, 12.54it/s] 29%|██▉       | 805/2736 [01:04<02:33, 12.55it/s] 29%|██▉       | 807/2736 [01:04<02:34, 12.49it/s] 30%|██▉       | 809/2736 [01:04<02:33, 12.57it/s] 30%|██▉       | 811/2736 [01:05<02:33, 12.53it/s] 30%|██▉       | 813/2736 [01:05<02:32, 12.59it/s] 30%|██▉       | 815/2736 [01:05<02:32, 12.58it/s] 30%|██▉       | 817/2736 [01:05<02:32, 12.59it/s] 30%|██▉       | 819/2736 [01:05<02:32, 12.53it/s] 30%|███       | 821/2736 [01:05<02:32, 12.54it/s] 30%|███       | 823/2736 [01:05<02:32, 12.58it/s] 30%|███       | 825/2736 [01:06<02:32, 12.52it/s] 30%|███       | 827/2736 [01:06<02:31, 12.56it/s] 30%|███       | 829/2736 [01:06<02:31, 12.60it/s] 30%|███       | 831/2736 [01:06<02:31, 12.58it/s] 30%|███       | 833/2736 [01:06<02:31, 12.59it/s] 31%|███       | 835/2736 [01:06<02:30, 12.62it/s] 31%|███       | 837/2736 [01:07<02:30, 12.63it/s] 31%|███       | 839/2736 [01:07<02:30, 12.61it/s] 31%|███       | 841/2736 [01:07<02:30, 12.60it/s] 31%|███       | 843/2736 [01:07<02:30, 12.57it/s] 31%|███       | 845/2736 [01:07<02:29, 12.62it/s] 31%|███       | 847/2736 [01:07<02:30, 12.53it/s] 31%|███       | 849/2736 [01:08<02:30, 12.52it/s] 31%|███       | 851/2736 [01:08<02:29, 12.59it/s] 31%|███       | 853/2736 [01:08<02:29, 12.58it/s] 31%|███▏      | 855/2736 [01:08<02:29, 12.60it/s] 31%|███▏      | 857/2736 [01:08<02:29, 12.61it/s] 31%|███▏      | 859/2736 
[01:08<02:28, 12.61it/s] 31%|███▏      | 861/2736 [01:08<02:28, 12.62it/s] 32%|███▏      | 863/2736 [01:09<02:29, 12.52it/s] 32%|███▏      | 865/2736 [01:09<02:29, 12.55it/s] 32%|███▏      | 867/2736 [01:09<02:29, 12.52it/s] 32%|███▏      | 869/2736 [01:09<02:28, 12.55it/s] 32%|███▏      | 871/2736 [01:09<02:28, 12.59it/s] 32%|███▏      | 873/2736 [01:09<02:29, 12.50it/s] 32%|███▏      | 875/2736 [01:10<02:27, 12.58it/s] 32%|███▏      | 877/2736 [01:10<02:28, 12.48it/s] 32%|███▏      | 879/2736 [01:10<02:28, 12.53it/s] 32%|███▏      | 881/2736 [01:10<02:29, 12.44it/s] 32%|███▏      | 883/2736 [01:10<02:28, 12.50it/s] 32%|███▏      | 885/2736 [01:10<02:27, 12.52it/s] 32%|███▏      | 887/2736 [01:11<02:28, 12.46it/s] 32%|███▏      | 889/2736 [01:11<02:27, 12.56it/s] 33%|███▎      | 891/2736 [01:11<02:27, 12.54it/s] 33%|███▎      | 893/2736 [01:11<02:27, 12.50it/s] 33%|███▎      | 895/2736 [01:11<02:26, 12.55it/s] 33%|███▎      | 897/2736 [01:11<02:26, 12.52it/s] 33%|███▎      | 899/2736 [01:12<02:26, 12.54it/s] 33%|███▎      | 901/2736 [01:12<02:25, 12.61it/s] 33%|███▎      | 903/2736 [01:12<02:26, 12.51it/s] 33%|███▎      | 905/2736 [01:12<02:26, 12.53it/s] 33%|███▎      | 907/2736 [01:12<02:26, 12.51it/s] 33%|███▎      | 909/2736 [01:12<02:25, 12.53it/s] 33%|███▎      | 911/2736 [01:12<02:25, 12.57it/s]
-  0%|          | 0/126 [00:00<?, ?it/s][A
-  1%|          | 1/126 [00:01<02:48,  1.35s/it][A
-  2%|▏         | 2/126 [00:02<02:41,  1.30s/it][A
-  2%|▏         | 3/126 [00:03<02:36,  1.27s/it][A
-  3%|▎         | 4/126 [00:05<02:33,  1.26s/it][A
-  4%|▍         | 5/126 [00:06<02:31,  1.25s/it][A
-  5%|▍         | 6/126 [00:07<02:29,  1.24s/it][A
-  6%|▌         | 7/126 [00:08<02:27,  1.24s/it][A
-  6%|▋         | 8/126 [00:10<02:25,  1.24s/it][A
-  7%|▋         | 9/126 [00:11<02:24,  1.23s/it][A
-  8%|▊         | 10/126 [00:12<02:23,  1.23s/it][A
-  9%|▊         | 11/126 [00:13<02:21,  1.23s/it][A 33%|███▎      | 912/2736 [01:27<02:25, 12.57it/s]
- 10%|▉         | 12/126 [00:14<02:20,  1.23s/it][A
- 10%|█         | 13/126 [00:16<02:19,  1.23s/it][A
- 11%|█         | 14/126 [00:17<02:17,  1.23s/it][A
- 12%|█▏        | 15/126 [00:18<02:16,  1.23s/it][A
- 13%|█▎        | 16/126 [00:19<02:15,  1.23s/it][A
- 13%|█▎        | 17/126 [00:21<02:14,  1.23s/it][A
- 14%|█▍        | 18/126 [00:22<02:13,  1.23s/it][A
- 15%|█▌        | 19/126 [00:23<02:11,  1.23s/it][A
- 16%|█▌        | 20/126 [00:24<02:10,  1.23s/it][A
- 17%|█▋        | 21/126 [00:26<02:09,  1.23s/it][A
- 17%|█▋        | 22/126 [00:27<02:07,  1.23s/it][A
- 18%|█▊        | 23/126 [00:28<02:06,  1.23s/it][A
- 19%|█▉        | 24/126 [00:29<02:05,  1.23s/it][A
- 20%|█▉        | 25/126 [00:30<02:04,  1.23s/it][A
- 21%|██        | 26/126 [00:32<02:03,  1.23s/it][A
- 21%|██▏       | 27/126 [00:33<02:02,  1.23s/it][A
- 22%|██▏       | 28/126 [00:34<02:00,  1.23s/it][A
- 23%|██▎       | 29/126 [00:35<01:59,  1.23s/it][A
- 24%|██▍       | 30/126 [00:37<01:57,  1.23s/it][A
- 25%|██▍       | 31/126 [00:38<01:56,  1.23s/it][A
- 25%|██▌       | 32/126 [00:39<01:55,  1.23s/it][A
- 26%|██▌       | 33/126 [00:40<01:54,  1.23s/it][A
- 27%|██▋       | 34/126 [00:42<01:53,  1.23s/it][A
- 28%|██▊       | 35/126 [00:43<01:52,  1.23s/it][A
- 29%|██▊       | 36/126 [00:44<01:50,  1.23s/it][A
- 29%|██▉       | 37/126 [00:45<01:49,  1.23s/it][A
- 30%|███       | 38/126 [00:46<01:48,  1.23s/it][A
- 31%|███       | 39/126 [00:48<01:47,  1.24s/it][A
- 32%|███▏      | 40/126 [00:49<01:46,  1.24s/it][A
- 33%|███▎      | 41/126 [00:50<01:44,  1.24s/it][A
- 33%|███▎      | 42/126 [00:51<01:43,  1.23s/it][A
- 34%|███▍      | 43/126 [00:53<01:42,  1.23s/it][A
- 35%|███▍      | 44/126 [00:54<01:40,  1.23s/it][A
- 36%|███▌      | 45/126 [00:55<01:39,  1.23s/it][A
- 37%|███▋      | 46/126 [00:56<01:38,  1.23s/it][A
- 37%|███▋      | 47/126 [00:58<01:37,  1.23s/it][A
- 38%|███▊      | 48/126 [00:59<01:35,  1.23s/it][A
- 39%|███▉      | 49/126 [01:00<01:34,  1.23s/it][A
- 40%|███▉      | 50/126 [01:01<01:33,  1.23s/it][A
- 40%|████      | 51/126 [01:02<01:32,  1.23s/it][A
- 41%|████▏     | 52/126 [01:04<01:30,  1.23s/it][A
- 42%|████▏     | 53/126 [01:05<01:29,  1.23s/it][A
- 43%|████▎     | 54/126 [01:06<01:28,  1.23s/it][A
- 44%|████▎     | 55/126 [01:07<01:27,  1.23s/it][A
- 44%|████▍     | 56/126 [01:09<01:26,  1.23s/it][A
- 45%|████▌     | 57/126 [01:10<01:24,  1.23s/it][A
- 46%|████▌     | 58/126 [01:11<01:23,  1.23s/it][A
- 47%|████▋     | 59/126 [01:12<01:22,  1.23s/it][A
- 48%|████▊     | 60/126 [01:14<01:21,  1.23s/it][A
- 48%|████▊     | 61/126 [01:15<01:19,  1.23s/it][A
- 49%|████▉     | 62/126 [01:16<01:18,  1.23s/it][A
- 50%|█████     | 63/126 [01:17<01:17,  1.23s/it][A
- 51%|█████     | 64/126 [01:18<01:16,  1.23s/it][A
- 52%|█████▏    | 65/126 [01:20<01:14,  1.23s/it][A
- 52%|█████▏    | 66/126 [01:21<01:13,  1.23s/it][A
- 53%|█████▎    | 67/126 [01:22<01:12,  1.23s/it][A
- 54%|█████▍    | 68/126 [01:23<01:11,  1.23s/it][A
- 55%|█████▍    | 69/126 [01:25<01:10,  1.23s/it][A
- 56%|█████▌    | 70/126 [01:26<01:08,  1.23s/it][A
- 56%|█████▋    | 71/126 [01:27<01:07,  1.23s/it][A
- 57%|█████▋    | 72/126 [01:28<01:06,  1.23s/it][A
- 58%|█████▊    | 73/126 [01:30<01:05,  1.23s/it][A
- 59%|█████▊    | 74/126 [01:31<01:04,  1.23s/it][A
- 60%|█████▉    | 75/126 [01:32<01:02,  1.23s/it][A
- 60%|██████    | 76/126 [01:33<01:01,  1.23s/it][A
- 61%|██████    | 77/126 [01:34<01:00,  1.23s/it][A
- 62%|██████▏   | 78/126 [01:36<00:59,  1.23s/it][A
- 63%|██████▎   | 79/126 [01:37<00:57,  1.23s/it][A
- 63%|██████▎   | 80/126 [01:38<00:56,  1.23s/it][A
- 64%|██████▍   | 81/126 [01:39<00:55,  1.23s/it][A
- 65%|██████▌   | 82/126 [01:41<00:54,  1.23s/it][A
- 66%|██████▌   | 83/126 [01:42<00:52,  1.23s/it][A
- 67%|██████▋   | 84/126 [01:43<00:51,  1.23s/it][A
- 67%|██████▋   | 85/126 [01:44<00:50,  1.23s/it][A
- 68%|██████▊   | 86/126 [01:46<00:49,  1.23s/it][A
- 69%|██████▉   | 87/126 [01:47<00:47,  1.23s/it][A
- 70%|██████▉   | 88/126 [01:48<00:46,  1.23s/it][A
- 71%|███████   | 89/126 [01:49<00:45,  1.23s/it][A
- 71%|███████▏  | 90/126 [01:50<00:44,  1.23s/it][A
- 72%|███████▏  | 91/126 [01:52<00:43,  1.23s/it][A
- 73%|███████▎  | 92/126 [01:53<00:41,  1.23s/it][A
- 74%|███████▍  | 93/126 [01:54<00:40,  1.23s/it][A
- 75%|███████▍  | 94/126 [01:55<00:39,  1.23s/it][A
- 75%|███████▌  | 95/126 [01:57<00:38,  1.23s/it][A
- 76%|███████▌  | 96/126 [01:58<00:36,  1.23s/it][A
- 77%|███████▋  | 97/126 [01:59<00:35,  1.23s/it][A
- 78%|███████▊  | 98/126 [02:00<00:34,  1.23s/it][A
- 79%|███████▊  | 99/126 [02:02<00:33,  1.23s/it][A
- 79%|███████▉  | 100/126 [02:03<00:31,  1.23s/it][A
- 80%|████████  | 101/126 [02:04<00:30,  1.23s/it][A
- 81%|████████  | 102/126 [02:05<00:29,  1.23s/it][A
- 82%|████████▏ | 103/126 [02:06<00:28,  1.23s/it][A
- 83%|████████▎ | 104/126 [02:08<00:27,  1.23s/it][A
- 83%|████████▎ | 105/126 [02:09<00:25,  1.23s/it][A
- 84%|████████▍ | 106/126 [02:10<00:24,  1.23s/it][A
- 85%|████████▍ | 107/126 [02:11<00:23,  1.23s/it][A
- 86%|████████▌ | 108/126 [02:13<00:22,  1.23s/it][A
- 87%|████████▋ | 109/126 [02:14<00:20,  1.23s/it][A
- 87%|████████▋ | 110/126 [02:15<00:19,  1.23s/it][A
- 88%|████████▊ | 111/126 [02:16<00:18,  1.23s/it][A
- 89%|████████▉ | 112/126 [02:18<00:17,  1.23s/it][A
- 90%|████████▉ | 113/126 [02:19<00:16,  1.23s/it][A
- 90%|█████████ | 114/126 [02:20<00:14,  1.23s/it][A
- 91%|█████████▏| 115/126 [02:21<00:13,  1.23s/it][A
- 92%|█████████▏| 116/126 [02:22<00:12,  1.23s/it][A
- 93%|█████████▎| 117/126 [02:24<00:11,  1.23s/it][A
- 94%|█████████▎| 118/126 [02:25<00:09,  1.23s/it][A
- 94%|█████████▍| 119/126 [02:26<00:08,  1.23s/it][A
- 95%|█████████▌| 120/126 [02:27<00:07,  1.23s/it][A
- 96%|█████████▌| 121/126 [02:29<00:06,  1.23s/it][A
- 97%|█████████▋| 122/126 [02:30<00:04,  1.23s/it][A
- 98%|█████████▊| 123/126 [02:31<00:03,  1.23s/it][A
- 98%|█████████▊| 124/126 [02:32<00:02,  1.23s/it][A 98%|█████████▊| 124/126 [02:32<00:02,  1.23s/it]
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 219, in <module>
-    for batch in tqdm(eval_dataloader):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/tqdm/std.py", line 1178, in __iter__
-    for obj in iterable:
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/accelerate/data_loader.py", line 394, in __iter__
-    next_batch = next(dataloader_iter)
-                 ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 633, in __next__
-    data = self._next_data()
-           ^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 677, in _next_data
-    data = self._dataset_fetcher.fetch(index)  # may raise StopIteration
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/_utils/fetch.py", line 54, in fetch
-    return self.collate_fn(data)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/data/data_collator.py", line 600, in __call__
-    decoder_input_ids = self.model.prepare_decoder_input_ids_from_labels(labels=features["labels"])
-                        ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/marian/modeling_marian.py", line 1527, in prepare_decoder_input_ids_from_labels
-    return shift_tokens_right(labels, self.config.pad_token_id, self.config.decoder_start_token_id)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/marian/modeling_marian.py", line 66, in shift_tokens_right
-    shifted_input_ids[:, 0] = decoder_start_token_id
-    ~~~~~~~~~~~~~~~~~^^^^^^
-IndexError: index 0 is out of bounds for dimension 1 with size 0
- 33%|███▎      | 912/2736 [03:46<07:32,  4.03it/s]
diff --git a/myerrors_1562.out b/myerrors_1562.out
deleted file mode 100644
index 826ae5ca517836b878ef48a25bf7264e06a44b3b..0000000000000000000000000000000000000000
--- a/myerrors_1562.out
+++ /dev/null
@@ -1,8 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.21s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.10s/it] 25%|██▌       | 4/16 [00:13<00:42,  3.55s/it] 31%|███▏      | 5/16 [00:17<00:41,  3.82s/it] 38%|███▊      | 6/16 [00:21<00:39,  3.98s/it] 44%|████▍     | 7/16 [00:26<00:36,  4.09s/it] 50%|█████     | 8/16 [00:30<00:33,  4.16s/it] 56%|█████▋    | 9/16 [00:34<00:29,  4.21s/it] 62%|██████▎   | 10/16 [00:38<00:25,  4.24s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.27s/it] 75%|███████▌  | 12/16 [00:47<00:17,  4.28s/it] 81%|████████▏ | 13/16 [00:51<00:12,  4.30s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.30s/it] 94%|█████████▍| 15/16 [01:00<00:04,  4.31s/it]100%|██████████| 16/16 [01:03<00:00,  3.93s/it]100%|██████████| 16/16 [01:03<00:00,  3.99s/it]
-  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:35,  4.39it/s]  0%|          | 3/684 [00:00<01:18,  8.73it/s]  1%|          | 5/684 [00:00<01:03, 10.71it/s]  1%|          | 7/684 [00:00<00:57, 11.86it/s]  1%|▏         | 9/684 [00:00<00:53, 12.54it/s]  2%|▏         | 11/684 [00:00<00:52, 12.92it/s]  2%|▏         | 13/684 [00:01<00:50, 13.23it/s]  2%|▏         | 15/684 [00:01<00:50, 13.36it/s]  2%|▏         | 17/684 [00:01<00:49, 13.47it/s]  3%|▎         | 19/684 [00:01<00:48, 13.61it/s]  3%|▎         | 21/684 [00:01<00:48, 13.64it/s]  3%|▎         | 23/684 [00:01<00:48, 13.63it/s]  4%|▎         | 25/684 [00:01<00:48, 13.72it/s]  4%|▍         | 27/684 [00:02<00:47, 13.73it/s]  4%|▍         | 29/684 [00:02<00:47, 13.71it/s]  5%|▍         | 31/684 [00:02<00:47, 13.76it/s]  5%|▍         | 33/684 [00:02<00:47, 13.71it/s]  5%|▌         | 35/684 [00:02<00:47, 13.76it/s]  5%|▌         | 37/684 [00:02<00:47, 13.77it/s]  6%|▌         | 39/684 [00:02<00:46, 13.74it/s]  6%|▌         | 41/684 [00:03<00:46, 13.74it/s]  6%|▋         | 43/684 [00:03<00:46, 13.73it/s]  7%|▋         | 45/684 [00:03<00:46, 13.71it/s]  7%|▋         | 47/684 [00:03<00:46, 13.77it/s]  7%|▋         | 49/684 [00:03<00:46, 13.72it/s]  7%|▋         | 51/684 [00:03<00:46, 13.70it/s]  8%|▊         | 53/684 [00:04<00:45, 13.78it/s]  8%|▊         | 55/684 [00:04<00:45, 13.76it/s]  8%|▊         | 57/684 [00:04<00:45, 13.72it/s]  9%|▊         | 59/684 [00:04<00:45, 13.77it/s]  9%|▉         | 61/684 [00:04<00:45, 13.76it/s]  9%|▉         | 63/684 [00:04<00:45, 13.74it/s] 10%|▉         | 65/684 [00:04<00:44, 13.78it/s] 10%|▉         | 67/684 [00:05<00:44, 13.76it/s] 10%|█         | 69/684 [00:05<00:44, 13.74it/s] 10%|█         | 71/684 [00:05<00:44, 13.76it/s] 11%|█         | 73/684 [00:05<00:44, 13.78it/s] 11%|█         | 75/684 [00:05<00:44, 13.79it/s] 11%|█▏        | 77/684 [00:05<00:44, 13.78it/s] 12%|█▏        | 79/684 [00:05<00:44, 13.72it/s] 
12%|█▏        | 81/684 [00:06<00:43, 13.78it/s] 12%|█▏        | 83/684 [00:06<00:43, 13.76it/s] 12%|█▏        | 85/684 [00:06<00:43, 13.73it/s] 13%|█▎        | 87/684 [00:06<00:43, 13.72it/s] 13%|█▎        | 89/684 [00:06<00:43, 13.74it/s] 13%|█▎        | 91/684 [00:06<00:43, 13.71it/s] 14%|█▎        | 93/684 [00:06<00:43, 13.72it/s] 14%|█▍        | 95/684 [00:07<00:42, 13.75it/s] 14%|█▍        | 97/684 [00:07<00:42, 13.78it/s] 14%|█▍        | 99/684 [00:07<00:42, 13.81it/s] 15%|█▍        | 101/684 [00:07<00:42, 13.81it/s] 15%|█▌        | 103/684 [00:07<00:42, 13.79it/s] 15%|█▌        | 105/684 [00:07<00:41, 13.79it/s] 16%|█▌        | 107/684 [00:07<00:41, 13.77it/s] 16%|█▌        | 109/684 [00:08<00:41, 13.80it/s] 16%|█▌        | 111/684 [00:08<00:41, 13.80it/s] 17%|█▋        | 113/684 [00:08<00:41, 13.78it/s] 17%|█▋        | 115/684 [00:08<00:41, 13.78it/s] 17%|█▋        | 117/684 [00:08<00:40, 13.83it/s] 17%|█▋        | 119/684 [00:08<00:41, 13.73it/s] 18%|█▊        | 121/684 [00:08<00:40, 13.75it/s] 18%|█▊        | 123/684 [00:09<00:40, 13.75it/s] 18%|█▊        | 125/684 [00:09<00:40, 13.76it/s] 19%|█▊        | 127/684 [00:09<00:40, 13.79it/s] 19%|█▉        | 129/684 [00:09<00:40, 13.76it/s] 19%|█▉        | 131/684 [00:09<00:40, 13.74it/s] 19%|█▉        | 133/684 [00:09<00:40, 13.73it/s] 20%|█▉        | 135/684 [00:09<00:40, 13.71it/s] 20%|██        | 137/684 [00:10<00:39, 13.69it/s] 20%|██        | 139/684 [00:10<00:39, 13.71it/s] 21%|██        | 141/684 [00:10<00:39, 13.72it/s] 21%|██        | 143/684 [00:10<00:39, 13.71it/s] 21%|██        | 145/684 [00:10<00:39, 13.72it/s] 21%|██▏       | 147/684 [00:10<00:39, 13.75it/s] 22%|██▏       | 149/684 [00:10<00:38, 13.86it/s] 22%|██▏       | 151/684 [00:11<00:38, 13.77it/s] 22%|██▏       | 153/684 [00:11<00:38, 13.82it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.88it/s] 23%|██▎       | 157/684 [00:11<00:37, 13.99it/s] 23%|██▎       | 159/684 [00:11<00:37, 13.88it/s] 24%|██▎   
    | 161/684 [00:11<00:37, 13.85it/s] 24%|██▍       | 163/684 [00:12<00:37, 13.77it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.71it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.71it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.78it/s] 25%|██▌       | 171/684 [00:12<00:37, 13.79it/s] 25%|██▌       | 173/684 [00:12<00:36, 13.82it/s] 26%|██▌       | 175/684 [00:12<00:36, 13.80it/s] 26%|██▌       | 177/684 [00:13<00:36, 13.77it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.77it/s] 26%|██▋       | 181/684 [00:13<00:36, 13.78it/s] 27%|██▋       | 183/684 [00:13<00:36, 13.76it/s] 27%|██▋       | 185/684 [00:13<00:36, 13.76it/s] 27%|██▋       | 187/684 [00:13<00:36, 13.75it/s] 28%|██▊       | 189/684 [00:13<00:36, 13.75it/s] 28%|██▊       | 191/684 [00:14<00:35, 13.75it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.76it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.75it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.76it/s] 29%|██▉       | 199/684 [00:14<00:35, 13.77it/s] 29%|██▉       | 201/684 [00:14<00:35, 13.78it/s] 30%|██▉       | 203/684 [00:14<00:34, 13.77it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.75it/s] 30%|███       | 207/684 [00:15<00:34, 13.79it/s] 31%|███       | 209/684 [00:15<00:34, 13.77it/s] 31%|███       | 211/684 [00:15<00:34, 13.77it/s] 31%|███       | 213/684 [00:15<00:34, 13.78it/s] 31%|███▏      | 215/684 [00:15<00:34, 13.75it/s] 32%|███▏      | 217/684 [00:15<00:33, 13.85it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.82it/s] 32%|███▏      | 221/684 [00:16<00:33, 13.77it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.76it/s] 33%|███▎      | 225/684 [00:16<00:33, 13.76it/s] 33%|███▎      | 227/684 [00:16<00:33, 13.82it/s] 33%|███▎      | 229/684 [00:19<03:24,  2.22it/s] 34%|███▍      | 231/684 [00:19<02:32,  2.97it/s] 34%|███▍      | 233/684 [00:19<01:55,  3.90it/s] 34%|███▍      | 235/684 [00:19<01:30,  4.96it/s] 35%|███▍      | 237/684 [00:19<01:13,  6.09it/s] 35%|███▍      | 239/684 [00:20<01:01,  7.22it/s] 35%|███▌  
    | 241/684 [00:20<00:53,  8.22it/s] 36%|███▌      | 243/684 [00:20<00:47,  9.25it/s] 36%|███▌      | 245/684 [00:20<00:43, 10.11it/s] 36%|███▌      | 247/684 [00:20<00:40, 10.91it/s] 36%|███▋      | 249/684 [00:20<00:38, 11.29it/s] 37%|███▋      | 251/684 [00:20<00:36, 11.91it/s] 37%|███▋      | 253/684 [00:21<00:35, 12.08it/s] 37%|███▋      | 255/684 [00:21<00:34, 12.56it/s] 38%|███▊      | 257/684 [00:21<00:33, 12.63it/s] 38%|███▊      | 259/684 [00:21<00:32, 13.01it/s] 38%|███▊      | 261/684 [00:21<00:32, 12.92it/s] 38%|███▊      | 263/684 [00:21<00:31, 13.21it/s] 39%|███▊      | 265/684 [00:22<00:32, 12.93it/s] 39%|███▉      | 267/684 [00:22<00:31, 13.30it/s] 39%|███▉      | 269/684 [00:22<00:30, 13.51it/s] 40%|███▉      | 271/684 [00:22<00:31, 13.30it/s] 40%|███▉      | 273/684 [00:22<00:31, 13.14it/s] 40%|████      | 275/684 [00:22<00:30, 13.32it/s] 40%|████      | 277/684 [00:22<00:31, 12.97it/s] 41%|████      | 279/684 [00:23<00:31, 12.95it/s] 41%|████      | 281/684 [00:23<00:30, 13.06it/s] 41%|████▏     | 283/684 [00:23<00:30, 13.29it/s] 42%|████▏     | 285/684 [00:23<00:30, 13.09it/s] 42%|████▏     | 287/684 [00:23<00:29, 13.36it/s] 42%|████▏     | 289/684 [00:23<00:30, 13.13it/s] 43%|████▎     | 291/684 [00:24<00:30, 12.97it/s] 43%|████▎     | 293/684 [00:24<00:29, 13.22it/s] 43%|████▎     | 295/684 [00:24<00:29, 13.04it/s] 43%|████▎     | 297/684 [00:24<00:29, 13.11it/s] 44%|████▎     | 299/684 [00:24<00:29, 12.96it/s] 44%|████▍     | 301/684 [00:24<00:29, 13.16it/s] 44%|████▍     | 303/684 [00:24<00:28, 13.37it/s] 45%|████▍     | 305/684 [00:25<00:29, 12.93it/s] 45%|████▍     | 307/684 [00:25<00:29, 13.00it/s] 45%|████▌     | 309/684 [00:25<00:29, 12.85it/s] 45%|████▌     | 311/684 [00:25<00:29, 12.75it/s] 46%|████▌     | 313/684 [00:25<00:28, 13.03it/s] 46%|████▌     | 315/684 [00:25<00:28, 13.04it/s] 46%|████▋     | 317/684 [00:26<00:27, 13.17it/s] 47%|████▋     | 319/684 [00:26<00:27, 13.04it/s] 47%|████▋ 
    | 321/684 [00:26<00:27, 13.27it/s] 47%|████▋     | 323/684 [00:26<00:27, 13.35it/s] 48%|████▊     | 325/684 [00:26<00:26, 13.48it/s] 48%|████▊     | 327/684 [00:26<00:26, 13.29it/s] 48%|████▊     | 329/684 [00:26<00:26, 13.34it/s] 48%|████▊     | 331/684 [00:27<00:26, 13.48it/s] 49%|████▊     | 333/684 [00:27<00:25, 13.58it/s] 49%|████▉     | 335/684 [00:27<00:25, 13.67it/s] 49%|████▉     | 337/684 [00:27<00:25, 13.71it/s] 50%|████▉     | 339/684 [00:27<00:25, 13.75it/s] 50%|████▉     | 341/684 [00:27<00:25, 13.70it/s] 50%|█████     | 343/684 [00:27<00:24, 13.71it/s] 50%|█████     | 345/684 [00:28<00:24, 13.73it/s] 51%|█████     | 347/684 [00:28<00:24, 13.72it/s] 51%|█████     | 349/684 [00:28<00:24, 13.71it/s] 51%|█████▏    | 351/684 [00:28<00:24, 13.70it/s] 52%|█████▏    | 353/684 [00:28<00:24, 13.72it/s] 52%|█████▏    | 355/684 [00:28<00:24, 13.70it/s] 52%|█████▏    | 357/684 [00:28<00:23, 13.74it/s] 52%|█████▏    | 359/684 [00:29<00:23, 13.74it/s] 53%|█████▎    | 361/684 [00:29<00:23, 13.73it/s] 53%|█████▎    | 363/684 [00:29<00:23, 13.71it/s] 53%|█████▎    | 365/684 [00:29<00:23, 13.73it/s] 54%|█████▎    | 367/684 [00:29<00:23, 13.74it/s] 54%|█████▍    | 369/684 [00:29<00:22, 13.72it/s] 54%|█████▍    | 371/684 [00:29<00:22, 13.74it/s] 55%|█████▍    | 373/684 [00:30<00:22, 13.80it/s] 55%|█████▍    | 375/684 [00:30<00:22, 13.88it/s] 55%|█████▌    | 377/684 [00:30<00:22, 13.93it/s] 55%|█████▌    | 379/684 [00:30<00:22, 13.82it/s] 56%|█████▌    | 381/684 [00:30<00:21, 13.79it/s] 56%|█████▌    | 383/684 [00:30<00:21, 13.77it/s] 56%|█████▋    | 385/684 [00:30<00:21, 13.74it/s] 57%|█████▋    | 387/684 [00:31<00:21, 13.74it/s] 57%|█████▋    | 389/684 [00:31<00:21, 13.75it/s] 57%|█████▋    | 391/684 [00:31<00:21, 13.74it/s] 57%|█████▋    | 393/684 [00:31<00:21, 13.69it/s] 58%|█████▊    | 395/684 [00:31<00:21, 13.75it/s] 58%|█████▊    | 397/684 [00:31<00:20, 13.74it/s] 58%|█████▊    | 399/684 [00:31<00:20, 13.68it/s] 
59%|█████▊    | 401/684 [00:32<00:20, 13.69it/s] 59%|█████▉    | 403/684 [00:32<00:20, 13.70it/s] 59%|█████▉    | 405/684 [00:32<00:20, 13.74it/s] 60%|█████▉    | 407/684 [00:32<00:20, 13.73it/s] 60%|█████▉    | 409/684 [00:32<00:19, 13.77it/s] 60%|██████    | 411/684 [00:32<00:19, 13.87it/s] 60%|██████    | 413/684 [00:33<00:19, 13.96it/s] 61%|██████    | 415/684 [00:33<00:19, 13.95it/s] 61%|██████    | 417/684 [00:33<00:19, 13.88it/s] 61%|██████▏   | 419/684 [00:33<00:19, 13.86it/s] 62%|██████▏   | 421/684 [00:33<00:18, 14.00it/s] 62%|██████▏   | 423/684 [00:33<00:18, 13.99it/s] 62%|██████▏   | 425/684 [00:33<00:18, 14.04it/s] 62%|██████▏   | 427/684 [00:34<00:18, 14.01it/s] 63%|██████▎   | 429/684 [00:34<00:18, 13.96it/s] 63%|██████▎   | 431/684 [00:34<00:18, 13.91it/s] 63%|██████▎   | 433/684 [00:34<00:18, 13.87it/s] 64%|██████▎   | 435/684 [00:34<00:17, 13.85it/s] 64%|██████▍   | 437/684 [00:34<00:17, 13.80it/s] 64%|██████▍   | 439/684 [00:34<00:17, 13.80it/s] 64%|██████▍   | 441/684 [00:35<00:17, 13.80it/s] 65%|██████▍   | 443/684 [00:35<00:17, 13.81it/s] 65%|██████▌   | 445/684 [00:35<00:17, 13.83it/s] 65%|██████▌   | 447/684 [00:35<00:16, 13.96it/s] 66%|██████▌   | 449/684 [00:35<00:16, 13.96it/s] 66%|██████▌   | 451/684 [00:35<00:16, 13.89it/s] 66%|██████▌   | 453/684 [00:35<00:16, 13.87it/s] 67%|██████▋   | 455/684 [00:36<00:16, 13.85it/s] 67%|██████▋   | 457/684 [00:38<01:32,  2.44it/s] 67%|██████▋   | 459/684 [00:38<01:09,  3.24it/s] 67%|██████▋   | 461/684 [00:38<00:53,  4.20it/s] 68%|██████▊   | 463/684 [00:38<00:41,  5.29it/s] 68%|██████▊   | 465/684 [00:39<00:34,  6.37it/s] 68%|██████▊   | 467/684 [00:39<00:28,  7.51it/s] 69%|██████▊   | 469/684 [00:39<00:25,  8.53it/s] 69%|██████▉   | 471/684 [00:39<00:22,  9.52it/s] 69%|██████▉   | 473/684 [00:39<00:20, 10.06it/s] 69%|██████▉   | 475/684 [00:39<00:19, 10.69it/s] 70%|██████▉   | 477/684 [00:39<00:18, 11.19it/s] 70%|███████   | 479/684 [00:40<00:18, 11.27it/s] 
70%|███████   | 481/684 [00:40<00:17, 11.78it/s] 71%|███████   | 483/684 [00:40<00:17, 11.77it/s] 71%|███████   | 485/684 [00:40<00:16, 12.00it/s] 71%|███████   | 487/684 [00:40<00:16, 12.10it/s] 71%|███████▏  | 489/684 [00:40<00:16, 12.10it/s] 72%|███████▏  | 491/684 [00:41<00:15, 12.24it/s] 72%|███████▏  | 493/684 [00:41<00:15, 12.17it/s] 72%|███████▏  | 495/684 [00:41<00:15, 12.41it/s] 73%|███████▎  | 497/684 [00:41<00:15, 12.44it/s] 73%|███████▎  | 499/684 [00:41<00:14, 12.39it/s]                                                  73%|███████▎  | 500/684 [00:41<00:14, 12.39it/s] 73%|███████▎  | 501/684 [00:41<00:15, 12.18it/s] 74%|███████▎  | 503/684 [00:42<00:14, 12.57it/s] 74%|███████▍  | 505/684 [00:42<00:14, 12.54it/s] 74%|███████▍  | 507/684 [00:42<00:14, 12.49it/s] 74%|███████▍  | 509/684 [00:42<00:14, 12.21it/s] 75%|███████▍  | 511/684 [00:42<00:13, 12.73it/s] 75%|███████▌  | 513/684 [00:42<00:13, 12.47it/s] 75%|███████▌  | 515/684 [00:43<00:13, 12.57it/s] 76%|███████▌  | 517/684 [00:43<00:12, 12.88it/s] 76%|███████▌  | 519/684 [00:43<00:12, 12.69it/s] 76%|███████▌  | 521/684 [00:43<00:12, 12.72it/s] 76%|███████▋  | 523/684 [00:43<00:12, 12.72it/s] 77%|███████▋  | 525/684 [00:43<00:12, 12.68it/s] 77%|███████▋  | 527/684 [00:43<00:12, 13.03it/s] 77%|███████▋  | 529/684 [00:44<00:11, 13.00it/s] 78%|███████▊  | 531/684 [00:44<00:11, 13.22it/s] 78%|███████▊  | 533/684 [00:44<00:11, 13.03it/s] 78%|███████▊  | 535/684 [00:44<00:11, 13.08it/s] 79%|███████▊  | 537/684 [00:44<00:10, 13.41it/s] 79%|███████▉  | 539/684 [00:44<00:10, 13.41it/s] 79%|███████▉  | 541/684 [00:45<00:10, 13.43it/s] 79%|███████▉  | 543/684 [00:45<00:10, 13.44it/s] 80%|███████▉  | 545/684 [00:45<00:10, 13.45it/s] 80%|███████▉  | 547/684 [00:45<00:10, 13.45it/s] 80%|████████  | 549/684 [00:45<00:10, 13.40it/s] 81%|████████  | 551/684 [00:45<00:09, 13.37it/s] 81%|████████  | 553/684 [00:45<00:09, 13.40it/s] 81%|████████  | 555/684 [00:46<00:09, 13.43it/s]
 81%|████████▏ | 557/684 [00:46<00:09, 13.47it/s] 82%|████████▏ | 559/684 [00:46<00:09, 13.49it/s] 82%|████████▏ | 561/684 [00:46<00:09, 13.46it/s] 82%|████████▏ | 563/684 [00:46<00:08, 13.47it/s] 83%|████████▎ | 565/684 [00:46<00:08, 13.40it/s] 83%|████████▎ | 567/684 [00:46<00:08, 13.42it/s] 83%|████████▎ | 569/684 [00:47<00:08, 13.46it/s] 83%|████████▎ | 571/684 [00:47<00:08, 13.47it/s] 84%|████████▍ | 573/684 [00:47<00:08, 13.51it/s] 84%|████████▍ | 575/684 [00:47<00:08, 13.49it/s] 84%|████████▍ | 577/684 [00:47<00:07, 13.53it/s] 85%|████████▍ | 579/684 [00:47<00:07, 13.25it/s] 85%|████████▍ | 581/684 [00:48<00:07, 13.30it/s] 85%|████████▌ | 583/684 [00:48<00:07, 13.36it/s] 86%|████████▌ | 585/684 [00:48<00:07, 13.39it/s] 86%|████████▌ | 587/684 [00:48<00:07, 13.44it/s] 86%|████████▌ | 589/684 [00:48<00:07, 13.44it/s] 86%|████████▋ | 591/684 [00:48<00:06, 13.38it/s] 87%|████████▋ | 593/684 [00:48<00:06, 13.39it/s] 87%|████████▋ | 595/684 [00:49<00:06, 13.40it/s] 87%|████████▋ | 597/684 [00:49<00:06, 13.48it/s] 88%|████████▊ | 599/684 [00:49<00:06, 13.50it/s] 88%|████████▊ | 601/684 [00:49<00:06, 13.51it/s] 88%|████████▊ | 603/684 [00:49<00:05, 13.53it/s] 88%|████████▊ | 605/684 [00:49<00:05, 13.52it/s] 89%|████████▊ | 607/684 [00:49<00:05, 13.63it/s] 89%|████████▉ | 609/684 [00:50<00:05, 13.73it/s] 89%|████████▉ | 611/684 [00:50<00:05, 13.76it/s] 90%|████████▉ | 613/684 [00:50<00:05, 13.87it/s] 90%|████████▉ | 615/684 [00:50<00:04, 13.84it/s] 90%|█████████ | 617/684 [00:50<00:04, 13.75it/s] 90%|█████████ | 619/684 [00:50<00:04, 13.68it/s] 91%|█████████ | 621/684 [00:50<00:04, 13.65it/s] 91%|█████████ | 623/684 [00:51<00:04, 13.61it/s] 91%|█████████▏| 625/684 [00:51<00:04, 13.57it/s] 92%|█████████▏| 627/684 [00:51<00:04, 13.52it/s] 92%|█████████▏| 629/684 [00:51<00:04, 13.50it/s] 92%|█████████▏| 631/684 [00:51<00:03, 13.49it/s] 93%|█████████▎| 633/684 [00:51<00:03, 13.51it/s] 93%|█████████▎| 635/684 [00:51<00:03, 13.57it/s]
 93%|█████████▎| 637/684 [00:52<00:03, 13.58it/s] 93%|█████████▎| 639/684 [00:52<00:03, 13.60it/s] 94%|█████████▎| 641/684 [00:52<00:03, 13.62it/s] 94%|█████████▍| 643/684 [00:52<00:03, 13.60it/s] 94%|█████████▍| 645/684 [00:52<00:02, 13.63it/s] 95%|█████████▍| 647/684 [00:52<00:02, 13.65it/s] 95%|█████████▍| 649/684 [00:53<00:02, 13.66it/s] 95%|█████████▌| 651/684 [00:53<00:02, 13.68it/s] 95%|█████████▌| 653/684 [00:53<00:02, 13.67it/s] 96%|█████████▌| 655/684 [00:53<00:02, 13.66it/s] 96%|█████████▌| 657/684 [00:53<00:01, 13.67it/s] 96%|█████████▋| 659/684 [00:53<00:01, 13.66it/s] 97%|█████████▋| 661/684 [00:53<00:01, 13.69it/s] 97%|█████████▋| 663/684 [00:54<00:01, 13.61it/s] 97%|█████████▋| 665/684 [00:54<00:01, 13.62it/s] 98%|█████████▊| 667/684 [00:54<00:01, 13.59it/s] 98%|█████████▊| 669/684 [00:54<00:01, 13.59it/s] 98%|█████████▊| 671/684 [00:54<00:00, 13.62it/s] 98%|█████████▊| 673/684 [00:54<00:00, 13.55it/s] 99%|█████████▊| 675/684 [00:54<00:00, 13.56it/s] 99%|█████████▉| 677/684 [00:55<00:00, 13.58it/s] 99%|█████████▉| 679/684 [00:55<00:00, 13.57it/s]100%|█████████▉| 681/684 [00:55<00:00, 13.55it/s]100%|█████████▉| 683/684 [00:55<00:00, 13.55it/s]                                                 100%|██████████| 684/684 [00:58<00:00, 13.55it/s]100%|██████████| 684/684 [00:58<00:00, 11.72it/s]
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.16s/it] 19%|█▉        | 3/16 [00:08<00:39,  3.06s/it] 25%|██▌       | 4/16 [00:12<00:42,  3.53s/it] 31%|███▏      | 5/16 [00:17<00:41,  3.81s/it] 38%|███▊      | 6/16 [00:21<00:39,  3.98s/it] 44%|████▍     | 7/16 [00:25<00:36,  4.08s/it] 50%|█████     | 8/16 [00:30<00:33,  4.16s/it] 56%|█████▋    | 9/16 [00:34<00:29,  4.21s/it] 62%|██████▎   | 10/16 [00:38<00:25,  4.24s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.27s/it] 75%|███████▌  | 12/16 [00:47<00:17,  4.29s/it] 81%|████████▏ | 13/16 [00:51<00:12,  4.29s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.30s/it] 94%|█████████▍| 15/16 [01:00<00:04,  4.31s/it]100%|██████████| 16/16 [01:03<00:00,  3.93s/it]100%|██████████| 16/16 [01:03<00:00,  3.99s/it]
-/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning
-  warnings.warn(
-/mnt/storage/aatherton/hf_eng_fra_trans is already a clone of https://huggingface.co/aatherton2024/hf_eng_fra_trans. Make sure you pull the latest changes with `repo.git_pull()`.
-  0%|          | 0/2736 [00:00<?, ?it/s]  0%|          | 1/2736 [00:00<04:54,  9.28it/s]  0%|          | 3/2736 [00:00<04:05, 11.14it/s]  0%|          | 5/2736 [00:00<03:53, 11.68it/s]  0%|          | 7/2736 [00:00<03:46, 12.05it/s]  0%|          | 9/2736 [00:00<03:45, 12.11it/s]  0%|          | 11/2736 [00:00<03:42, 12.27it/s]  0%|          | 13/2736 [00:01<03:41, 12.27it/s]  1%|          | 15/2736 [00:01<03:40, 12.36it/s]  1%|          | 17/2736 [00:01<03:38, 12.42it/s]  1%|          | 19/2736 [00:01<03:39, 12.40it/s]  1%|          | 21/2736 [00:01<03:38, 12.43it/s]  1%|          | 23/2736 [00:01<03:37, 12.49it/s]  1%|          | 25/2736 [00:02<03:36, 12.55it/s]  1%|          | 27/2736 [00:02<03:35, 12.58it/s]  1%|          | 29/2736 [00:02<03:34, 12.62it/s]  1%|          | 31/2736 [00:02<03:34, 12.59it/s]  1%|          | 33/2736 [00:02<03:35, 12.52it/s]  1%|▏         | 35/2736 [00:02<03:35, 12.52it/s]  1%|▏         | 37/2736 [00:02<03:35, 12.52it/s]  1%|▏         | 39/2736 [00:03<03:38, 12.36it/s]  1%|▏         | 41/2736 [00:03<03:39, 12.26it/s]  2%|▏         | 43/2736 [00:03<03:39, 12.28it/s]  2%|▏         | 45/2736 [00:03<03:38, 12.34it/s]slurmstepd-dl: error: *** JOB 1562 ON dl CANCELLED AT 2023-09-17T19:46:47 ***
diff --git a/myerrors_1563.out b/myerrors_1563.out
deleted file mode 100644
index 868fe83e911a189e97737c564af148aa235a558d..0000000000000000000000000000000000000000
--- a/myerrors_1563.out
+++ /dev/null
@@ -1,161 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:31,  2.24s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.13s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.59s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.84s/it] 38%|███▊      | 6/16 [00:21<00:39,  4.00s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.12s/it] 50%|█████     | 8/16 [00:30<00:33,  4.20s/it] 56%|█████▋    | 9/16 [00:34<00:29,  4.25s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.29s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.31s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.32s/it] 81%|████████▏ | 13/16 [00:52<00:13,  4.34s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.34s/it] 94%|█████████▍| 15/16 [01:01<00:04,  4.35s/it]100%|██████████| 16/16 [01:04<00:00,  3.97s/it]100%|██████████| 16/16 [01:04<00:00,  4.03s/it]
-  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:37,  4.33it/s]  0%|          | 3/684 [00:00<01:17,  8.83it/s]  1%|          | 5/684 [00:00<01:02, 10.79it/s]  1%|          | 7/684 [00:00<00:57, 11.87it/s]  1%|▏         | 9/684 [00:00<00:54, 12.47it/s]  2%|▏         | 11/684 [00:00<00:52, 12.89it/s]  2%|▏         | 13/684 [00:01<00:51, 13.12it/s]  2%|▏         | 15/684 [00:01<00:50, 13.31it/s]  2%|▏         | 17/684 [00:01<00:49, 13.43it/s]  3%|▎         | 19/684 [00:01<00:49, 13.52it/s]  3%|▎         | 21/684 [00:01<00:48, 13.59it/s]  3%|▎         | 23/684 [00:01<00:48, 13.60it/s]  4%|▎         | 25/684 [00:01<00:48, 13.61it/s]  4%|▍         | 27/684 [00:02<00:48, 13.66it/s]  4%|▍         | 29/684 [00:02<00:47, 13.67it/s]  5%|▍         | 31/684 [00:02<00:47, 13.69it/s]  5%|▍         | 33/684 [00:02<00:47, 13.65it/s]  5%|▌         | 35/684 [00:02<00:46, 13.82it/s]  5%|▌         | 37/684 [00:02<00:46, 13.93it/s]  6%|▌         | 39/684 [00:02<00:46, 13.98it/s]  6%|▌         | 41/684 [00:03<00:45, 14.01it/s]  6%|▋         | 43/684 [00:03<00:45, 14.04it/s]  7%|▋         | 45/684 [00:03<00:45, 13.94it/s]  7%|▋         | 47/684 [00:03<00:45, 13.90it/s]  7%|▋         | 49/684 [00:03<00:45, 13.83it/s]  7%|▋         | 51/684 [00:03<00:45, 13.85it/s]  8%|▊         | 53/684 [00:03<00:45, 13.88it/s]  8%|▊         | 55/684 [00:04<00:45, 13.77it/s]  8%|▊         | 57/684 [00:04<00:45, 13.78it/s]  9%|▊         | 59/684 [00:04<00:45, 13.77it/s]  9%|▉         | 61/684 [00:04<00:45, 13.84it/s]  9%|▉         | 63/684 [00:04<00:44, 13.94it/s] 10%|▉         | 65/684 [00:04<00:44, 13.99it/s] 10%|▉         | 67/684 [00:05<00:44, 14.01it/s] 10%|█         | 69/684 [00:05<00:43, 14.00it/s] 10%|█         | 71/684 [00:05<00:43, 14.09it/s] 11%|█         | 73/684 [00:05<00:43, 14.03it/s] 11%|█         | 75/684 [00:05<00:43, 13.96it/s] 11%|█▏        | 77/684 [00:05<00:43, 13.85it/s] 12%|█▏        | 79/684 [00:05<00:43, 13.86it/s] 
12%|█▏        | 81/684 [00:06<00:43, 13.81it/s] 12%|█▏        | 83/684 [00:06<00:43, 13.85it/s] 12%|█▏        | 85/684 [00:06<00:43, 13.82it/s] 13%|█▎        | 87/684 [00:06<00:43, 13.80it/s] 13%|█▎        | 89/684 [00:06<00:43, 13.78it/s] 13%|█▎        | 91/684 [00:06<00:43, 13.78it/s] 14%|█▎        | 93/684 [00:06<00:42, 13.82it/s] 14%|█▍        | 95/684 [00:07<00:42, 13.83it/s] 14%|█▍        | 97/684 [00:07<00:42, 13.84it/s] 14%|█▍        | 99/684 [00:07<00:42, 13.76it/s] 15%|█▍        | 101/684 [00:07<00:42, 13.76it/s] 15%|█▌        | 103/684 [00:07<00:42, 13.74it/s] 15%|█▌        | 105/684 [00:07<00:42, 13.76it/s] 16%|█▌        | 107/684 [00:07<00:41, 13.82it/s] 16%|█▌        | 109/684 [00:08<00:41, 13.78it/s] 16%|█▌        | 111/684 [00:08<00:41, 13.76it/s] 17%|█▋        | 113/684 [00:08<00:41, 13.74it/s] 17%|█▋        | 115/684 [00:08<00:41, 13.79it/s] 17%|█▋        | 117/684 [00:08<00:41, 13.73it/s] 17%|█▋        | 119/684 [00:08<00:40, 13.81it/s] 18%|█▊        | 121/684 [00:08<00:40, 13.77it/s] 18%|█▊        | 123/684 [00:09<00:40, 13.76it/s] 18%|█▊        | 125/684 [00:09<00:40, 13.83it/s] 19%|█▊        | 127/684 [00:09<00:39, 13.98it/s] 19%|█▉        | 129/684 [00:09<00:39, 13.93it/s] 19%|█▉        | 131/684 [00:09<00:39, 13.85it/s] 19%|█▉        | 133/684 [00:09<00:39, 13.80it/s] 20%|█▉        | 135/684 [00:09<00:39, 13.78it/s] 20%|██        | 137/684 [00:10<00:39, 13.74it/s] 20%|██        | 139/684 [00:10<00:39, 13.78it/s] 21%|██        | 141/684 [00:10<00:39, 13.79it/s] 21%|██        | 143/684 [00:10<00:39, 13.76it/s] 21%|██        | 145/684 [00:10<00:39, 13.75it/s] 21%|██▏       | 147/684 [00:10<00:38, 13.77it/s] 22%|██▏       | 149/684 [00:10<00:40, 13.20it/s] 22%|██▏       | 151/684 [00:11<00:39, 13.33it/s] 22%|██▏       | 153/684 [00:11<00:39, 13.50it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.57it/s] 23%|██▎       | 157/684 [00:11<00:38, 13.62it/s] 23%|██▎       | 159/684 [00:11<00:38, 13.72it/s] 24%|██▎   
    | 161/684 [00:11<00:37, 13.80it/s] 24%|██▍       | 163/684 [00:11<00:37, 13.76it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.76it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.78it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.83it/s] 25%|██▌       | 171/684 [00:12<00:36, 13.96it/s] 25%|██▌       | 173/684 [00:12<00:36, 13.89it/s] 26%|██▌       | 175/684 [00:12<00:36, 13.85it/s] 26%|██▌       | 177/684 [00:12<00:36, 13.85it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.81it/s] 26%|██▋       | 181/684 [00:13<00:36, 13.78it/s] 27%|██▋       | 183/684 [00:13<00:36, 13.83it/s] 27%|██▋       | 185/684 [00:13<00:36, 13.82it/s] 27%|██▋       | 187/684 [00:13<00:36, 13.79it/s] 28%|██▊       | 189/684 [00:13<00:35, 13.78it/s] 28%|██▊       | 191/684 [00:14<00:35, 13.76it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.74it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.72it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.78it/s] 29%|██▉       | 199/684 [00:14<00:35, 13.78it/s] 29%|██▉       | 201/684 [00:14<00:35, 13.78it/s] 30%|██▉       | 203/684 [00:14<00:34, 13.77it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.76it/s] 30%|███       | 207/684 [00:15<00:34, 13.72it/s] 31%|███       | 209/684 [00:15<00:34, 13.75it/s] 31%|███       | 211/684 [00:15<00:34, 13.77it/s] 31%|███       | 213/684 [00:15<00:34, 13.80it/s] 31%|███▏      | 215/684 [00:15<00:34, 13.78it/s] 32%|███▏      | 217/684 [00:15<00:33, 13.77it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.78it/s] 32%|███▏      | 221/684 [00:16<00:33, 13.74it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.77it/s] 33%|███▎      | 225/684 [00:16<00:34, 13.45it/s] 33%|███▎      | 227/684 [00:16<00:34, 13.25it/s] 33%|███▎      | 229/684 [00:18<03:04,  2.46it/s] 34%|███▍      | 231/684 [00:19<02:18,  3.27it/s] 34%|███▍      | 233/684 [00:19<01:46,  4.23it/s] 34%|███▍      | 235/684 [00:19<01:23,  5.36it/s] 35%|███▍      | 237/684 [00:19<01:08,  6.56it/s] 35%|███▍      | 239/684 [00:19<00:58,  7.63it/s] 35%|███▌  
    | 241/684 [00:19<00:50,  8.81it/s] 36%|███▌      | 243/684 [00:20<00:46,  9.58it/s] 36%|███▌      | 245/684 [00:20<00:41, 10.59it/s] 36%|███▌      | 247/684 [00:20<00:39, 11.09it/s] 36%|███▋      | 249/684 [00:20<00:37, 11.68it/s] 37%|███▋      | 251/684 [00:20<00:36, 11.84it/s] 37%|███▋      | 253/684 [00:20<00:35, 12.10it/s] 37%|███▋      | 255/684 [00:20<00:34, 12.27it/s] 38%|███▊      | 257/684 [00:21<00:34, 12.51it/s] 38%|███▊      | 259/684 [00:21<00:33, 12.71it/s] 38%|███▊      | 261/684 [00:21<00:32, 13.07it/s] 38%|███▊      | 263/684 [00:21<00:31, 13.27it/s] 39%|███▊      | 265/684 [00:21<00:32, 13.00it/s] 39%|███▉      | 267/684 [00:21<00:31, 13.29it/s] 39%|███▉      | 269/684 [00:22<00:30, 13.48it/s] 40%|███▉      | 271/684 [00:22<00:31, 13.23it/s] 40%|███▉      | 273/684 [00:22<00:31, 13.24it/s] 40%|████      | 275/684 [00:22<00:31, 13.16it/s] 40%|████      | 277/684 [00:22<00:30, 13.48it/s] 41%|████      | 279/684 [00:22<00:30, 13.15it/s] 41%|████      | 281/684 [00:22<00:30, 13.02it/s] 41%|████▏     | 283/684 [00:23<00:30, 13.35it/s] 42%|████▏     | 285/684 [00:23<00:29, 13.50it/s] 42%|████▏     | 287/684 [00:23<00:30, 13.23it/s] 42%|████▏     | 289/684 [00:23<00:29, 13.48it/s] 43%|████▎     | 291/684 [00:23<00:29, 13.19it/s] 43%|████▎     | 293/684 [00:23<00:29, 13.46it/s] 43%|████▎     | 295/684 [00:23<00:29, 13.08it/s] 43%|████▎     | 297/684 [00:24<00:29, 12.94it/s] 44%|████▎     | 299/684 [00:24<00:29, 13.03it/s] 44%|████▍     | 301/684 [00:24<00:29, 12.85it/s] 44%|████▍     | 303/684 [00:24<00:29, 12.70it/s] 45%|████▍     | 305/684 [00:24<00:30, 12.35it/s] 45%|████▍     | 307/684 [00:24<00:30, 12.26it/s] 45%|████▌     | 309/684 [00:25<00:30, 12.17it/s] 45%|████▌     | 311/684 [00:25<00:31, 12.02it/s] 46%|████▌     | 313/684 [00:25<00:30, 12.10it/s] 46%|████▌     | 315/684 [00:25<00:30, 12.19it/s] 46%|████▋     | 317/684 [00:25<00:30, 12.20it/s] 47%|████▋     | 319/684 [00:25<00:30, 12.06it/s] 47%|████▋ 
    | 321/684 [00:26<00:29, 12.33it/s] 47%|████▋     | 323/684 [00:26<00:28, 12.50it/s] 48%|████▊     | 325/684 [00:26<00:27, 12.84it/s] 48%|████▊     | 327/684 [00:26<00:27, 13.08it/s] 48%|████▊     | 329/684 [00:26<00:26, 13.26it/s] 48%|████▊     | 331/684 [00:26<00:26, 13.41it/s] 49%|████▊     | 333/684 [00:26<00:25, 13.51it/s] 49%|████▉     | 335/684 [00:27<00:25, 13.65it/s] 49%|████▉     | 337/684 [00:27<00:25, 13.77it/s] 50%|████▉     | 339/684 [00:27<00:24, 13.83it/s] 50%|████▉     | 341/684 [00:27<00:24, 13.80it/s] 50%|█████     | 343/684 [00:27<00:24, 13.75it/s] 50%|█████     | 345/684 [00:27<00:24, 13.78it/s] 51%|█████     | 347/684 [00:28<00:24, 13.72it/s] 51%|█████     | 349/684 [00:28<00:24, 13.71it/s] 51%|█████▏    | 351/684 [00:28<00:24, 13.73it/s] 52%|█████▏    | 353/684 [00:28<00:24, 13.67it/s] 52%|█████▏    | 355/684 [00:28<00:24, 13.67it/s] 52%|█████▏    | 357/684 [00:28<00:23, 13.69it/s] 52%|█████▏    | 359/684 [00:28<00:23, 13.69it/s] 53%|█████▎    | 361/684 [00:29<00:23, 13.73it/s] 53%|█████▎    | 363/684 [00:29<00:23, 13.73it/s] 53%|█████▎    | 365/684 [00:29<00:23, 13.71it/s] 54%|█████▎    | 367/684 [00:29<00:23, 13.73it/s] 54%|█████▍    | 369/684 [00:29<00:23, 13.66it/s] 54%|█████▍    | 371/684 [00:29<00:22, 13.65it/s] 55%|█████▍    | 373/684 [00:29<00:22, 13.70it/s] 55%|█████▍    | 375/684 [00:30<00:22, 13.65it/s] 55%|█████▌    | 377/684 [00:30<00:22, 13.73it/s] 55%|█████▌    | 379/684 [00:30<00:22, 13.69it/s] 56%|█████▌    | 381/684 [00:30<00:22, 13.73it/s] 56%|█████▌    | 383/684 [00:30<00:21, 13.74it/s] 56%|█████▋    | 385/684 [00:30<00:21, 13.77it/s] 57%|█████▋    | 387/684 [00:30<00:21, 13.78it/s] 57%|█████▋    | 389/684 [00:31<00:21, 13.78it/s] 57%|█████▋    | 391/684 [00:31<00:21, 13.76it/s] 57%|█████▋    | 393/684 [00:31<00:21, 13.74it/s] 58%|█████▊    | 395/684 [00:31<00:21, 13.75it/s] 58%|█████▊    | 397/684 [00:31<00:20, 13.76it/s] 58%|█████▊    | 399/684 [00:31<00:20, 13.78it/s] 
59%|█████▊    | 401/684 [00:31<00:20, 13.85it/s] 59%|█████▉    | 403/684 [00:32<00:20, 13.75it/s] 59%|█████▉    | 405/684 [00:32<00:20, 13.77it/s] 60%|█████▉    | 407/684 [00:32<00:20, 13.73it/s] 60%|█████▉    | 409/684 [00:32<00:20, 13.75it/s] 60%|██████    | 411/684 [00:32<00:19, 13.70it/s] 60%|██████    | 413/684 [00:32<00:19, 13.70it/s] 61%|██████    | 415/684 [00:32<00:19, 13.72it/s] 61%|██████    | 417/684 [00:33<00:19, 13.78it/s] 61%|██████▏   | 419/684 [00:33<00:18, 13.97it/s] 62%|██████▏   | 421/684 [00:33<00:18, 13.89it/s] 62%|██████▏   | 423/684 [00:33<00:18, 13.84it/s] 62%|██████▏   | 425/684 [00:33<00:18, 13.75it/s] 62%|██████▏   | 427/684 [00:33<00:18, 13.74it/s] 63%|██████▎   | 429/684 [00:33<00:18, 13.75it/s] 63%|██████▎   | 431/684 [00:34<00:18, 13.72it/s] 63%|██████▎   | 433/684 [00:34<00:18, 13.75it/s] 64%|██████▎   | 435/684 [00:34<00:18, 13.76it/s] 64%|██████▍   | 437/684 [00:34<00:17, 13.74it/s] 64%|██████▍   | 439/684 [00:34<00:17, 13.75it/s] 64%|██████▍   | 441/684 [00:34<00:17, 13.74it/s] 65%|██████▍   | 443/684 [00:34<00:17, 13.75it/s] 65%|██████▌   | 445/684 [00:35<00:17, 13.79it/s] 65%|██████▌   | 447/684 [00:35<00:16, 13.96it/s] 66%|██████▌   | 449/684 [00:35<00:16, 13.92it/s] 66%|██████▌   | 451/684 [00:35<00:16, 13.83it/s] 66%|██████▌   | 453/684 [00:35<00:16, 13.80it/s] 67%|██████▋   | 455/684 [00:35<00:16, 13.74it/s] 67%|██████▋   | 457/684 [00:38<01:31,  2.49it/s] 67%|██████▋   | 459/684 [00:38<01:08,  3.31it/s] 67%|██████▋   | 461/684 [00:38<00:52,  4.28it/s] 68%|██████▊   | 463/684 [00:38<00:41,  5.39it/s] 68%|██████▊   | 465/684 [00:38<00:33,  6.52it/s] 68%|██████▊   | 467/684 [00:38<00:28,  7.69it/s] 69%|██████▊   | 469/684 [00:39<00:24,  8.67it/s] 69%|██████▉   | 471/684 [00:39<00:22,  9.63it/s] 69%|██████▉   | 473/684 [00:39<00:20, 10.16it/s] 69%|██████▉   | 475/684 [00:39<00:19, 10.79it/s] 70%|██████▉   | 477/684 [00:39<00:18, 11.25it/s] 70%|███████   | 479/684 [00:39<00:18, 11.22it/s] 
70%|███████   | 481/684 [00:40<00:17, 11.51it/s] 71%|███████   | 483/684 [00:40<00:17, 11.64it/s] 71%|███████   | 485/684 [00:40<00:17, 11.63it/s] 71%|███████   | 487/684 [00:40<00:16, 11.81it/s] 71%|███████▏  | 489/684 [00:40<00:15, 12.42it/s] 72%|███████▏  | 491/684 [00:40<00:15, 12.31it/s] 72%|███████▏  | 493/684 [00:41<00:15, 12.35it/s] 72%|███████▏  | 495/684 [00:41<00:14, 12.83it/s] 73%|███████▎  | 497/684 [00:41<00:14, 12.73it/s] 73%|███████▎  | 499/684 [00:41<00:14, 13.01it/s]                                                  73%|███████▎  | 500/684 [00:41<00:14, 13.01it/s] 73%|███████▎  | 501/684 [00:41<00:14, 12.73it/s] 74%|███████▎  | 503/684 [00:41<00:14, 12.82it/s] 74%|███████▍  | 505/684 [00:41<00:13, 12.99it/s] 74%|███████▍  | 507/684 [00:42<00:13, 12.67it/s] 74%|███████▍  | 509/684 [00:42<00:13, 12.86it/s] 75%|███████▍  | 511/684 [00:42<00:13, 12.84it/s] 75%|███████▌  | 513/684 [00:42<00:13, 12.96it/s] 75%|███████▌  | 515/684 [00:42<00:13, 12.77it/s] 76%|███████▌  | 517/684 [00:42<00:12, 12.88it/s] 76%|███████▌  | 519/684 [00:43<00:12, 12.99it/s] 76%|███████▌  | 521/684 [00:43<00:12, 12.77it/s] 76%|███████▋  | 523/684 [00:43<00:12, 13.11it/s] 77%|███████▋  | 525/684 [00:43<00:12, 12.88it/s] 77%|███████▋  | 527/684 [00:43<00:12, 12.81it/s] 77%|███████▋  | 529/684 [00:43<00:11, 13.01it/s] 78%|███████▊  | 531/684 [00:43<00:11, 13.12it/s] 78%|███████▊  | 533/684 [00:44<00:11, 13.01it/s] 78%|███████▊  | 535/684 [00:44<00:11, 13.22it/s] 79%|███████▊  | 537/684 [00:44<00:10, 13.44it/s] 79%|███████▉  | 539/684 [00:44<00:10, 13.60it/s] 79%|███████▉  | 541/684 [00:44<00:10, 13.77it/s] 79%|███████▉  | 543/684 [00:44<00:10, 13.71it/s] 80%|███████▉  | 545/684 [00:45<00:10, 13.81it/s] 80%|███████▉  | 547/684 [00:45<00:09, 13.92it/s] 80%|████████  | 549/684 [00:45<00:09, 13.89it/s] 81%|████████  | 551/684 [00:45<00:09, 13.99it/s] 81%|████████  | 553/684 [00:45<00:09, 14.05it/s] 81%|████████  | 555/684 [00:45<00:09, 14.03it/s]
 81%|████████▏ | 557/684 [00:45<00:09, 14.07it/s] 82%|████████▏ | 559/684 [00:46<00:08, 13.97it/s] 82%|████████▏ | 561/684 [00:46<00:08, 13.87it/s] 82%|████████▏ | 563/684 [00:46<00:08, 13.92it/s] 83%|████████▎ | 565/684 [00:46<00:08, 13.98it/s] 83%|████████▎ | 567/684 [00:46<00:08, 13.94it/s] 83%|████████▎ | 569/684 [00:46<00:08, 14.01it/s] 83%|████████▎ | 571/684 [00:46<00:08, 13.98it/s] 84%|████████▍ | 573/684 [00:47<00:08, 13.86it/s] 84%|████████▍ | 575/684 [00:47<00:07, 13.80it/s] 84%|████████▍ | 577/684 [00:47<00:07, 13.70it/s] 85%|████████▍ | 579/684 [00:47<00:07, 13.63it/s] 85%|████████▍ | 581/684 [00:47<00:07, 13.63it/s] 85%|████████▌ | 583/684 [00:47<00:07, 13.66it/s] 86%|████████▌ | 585/684 [00:47<00:07, 13.74it/s] 86%|████████▌ | 587/684 [00:48<00:06, 13.87it/s] 86%|████████▌ | 589/684 [00:48<00:06, 13.83it/s] 86%|████████▋ | 591/684 [00:48<00:06, 13.76it/s] 87%|████████▋ | 593/684 [00:48<00:06, 13.71it/s] 87%|████████▋ | 595/684 [00:48<00:06, 13.70it/s] 87%|████████▋ | 597/684 [00:48<00:06, 13.64it/s] 88%|████████▊ | 599/684 [00:48<00:06, 13.63it/s] 88%|████████▊ | 601/684 [00:49<00:06, 13.58it/s] 88%|████████▊ | 603/684 [00:49<00:05, 13.56it/s] 88%|████████▊ | 605/684 [00:49<00:05, 13.56it/s] 89%|████████▊ | 607/684 [00:49<00:05, 13.75it/s] 89%|████████▉ | 609/684 [00:49<00:05, 13.76it/s] 89%|████████▉ | 611/684 [00:49<00:05, 13.72it/s] 90%|████████▉ | 613/684 [00:49<00:05, 13.69it/s] 90%|████████▉ | 615/684 [00:50<00:04, 13.93it/s] 90%|█████████ | 617/684 [00:50<00:04, 14.00it/s] 90%|█████████ | 619/684 [00:50<00:04, 13.96it/s] 91%|█████████ | 621/684 [00:50<00:04, 14.03it/s] 91%|█████████ | 623/684 [00:50<00:04, 13.93it/s] 91%|█████████▏| 625/684 [00:50<00:04, 13.94it/s] 92%|█████████▏| 627/684 [00:50<00:04, 13.77it/s] 92%|█████████▏| 629/684 [00:51<00:03, 13.82it/s] 92%|█████████▏| 631/684 [00:51<00:03, 13.82it/s] 93%|█████████▎| 633/684 [00:51<00:03, 13.70it/s] 93%|█████████▎| 635/684 [00:51<00:03, 13.63it/s]
 93%|█████████▎| 637/684 [00:51<00:03, 13.64it/s] 93%|█████████▎| 639/684 [00:51<00:03, 13.62it/s] 94%|█████████▎| 641/684 [00:51<00:03, 13.69it/s] 94%|█████████▍| 643/684 [00:52<00:02, 13.81it/s] 94%|█████████▍| 645/684 [00:52<00:02, 13.73it/s] 95%|█████████▍| 647/684 [00:52<00:02, 13.71it/s] 95%|█████████▍| 649/684 [00:52<00:02, 13.68it/s] 95%|█████████▌| 651/684 [00:52<00:02, 13.60it/s] 95%|█████████▌| 653/684 [00:52<00:02, 13.53it/s] 96%|█████████▌| 655/684 [00:52<00:02, 13.53it/s] 96%|█████████▌| 657/684 [00:53<00:01, 13.55it/s] 96%|█████████▋| 659/684 [00:53<00:01, 13.53it/s] 97%|█████████▋| 661/684 [00:53<00:01, 13.51it/s] 97%|█████████▋| 663/684 [00:53<00:01, 13.52it/s] 97%|█████████▋| 665/684 [00:53<00:01, 13.48it/s] 98%|█████████▊| 667/684 [00:53<00:01, 13.35it/s] 98%|█████████▊| 669/684 [00:54<00:01, 13.33it/s] 98%|█████████▊| 671/684 [00:54<00:00, 13.38it/s] 98%|█████████▊| 673/684 [00:54<00:00, 13.40it/s] 99%|█████████▊| 675/684 [00:54<00:00, 13.43it/s] 99%|█████████▉| 677/684 [00:54<00:00, 13.49it/s] 99%|█████████▉| 679/684 [00:54<00:00, 13.49it/s]100%|█████████▉| 681/684 [00:54<00:00, 13.48it/s]100%|█████████▉| 683/684 [00:55<00:00, 13.42it/s]                                                 100%|██████████| 684/684 [00:57<00:00, 13.42it/s]100%|██████████| 684/684 [00:57<00:00, 11.81it/s]
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.21s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.12s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.59s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.88s/it] 38%|███▊      | 6/16 [00:22<00:40,  4.06s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.17s/it] 50%|█████     | 8/16 [00:30<00:33,  4.24s/it] 56%|█████▋    | 9/16 [00:35<00:30,  4.29s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.32s/it] 69%|██████▉   | 11/16 [00:44<00:21,  4.35s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.36s/it] 81%|████████▏ | 13/16 [00:52<00:13,  4.38s/it] 88%|████████▊ | 14/16 [00:57<00:08,  4.39s/it] 94%|█████████▍| 15/16 [01:01<00:04,  4.40s/it]100%|██████████| 16/16 [01:04<00:00,  4.01s/it]100%|██████████| 16/16 [01:05<00:00,  4.06s/it]
-/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning
-  warnings.warn(
-/mnt/storage/aatherton/hf_eng_fra_trans is already a clone of https://huggingface.co/aatherton2024/hf_eng_fra_trans. Make sure you pull the latest changes with `repo.git_pull()`.
-  0%|          | 0/2736 [00:00<?, ?it/s]  0%|          | 2/2736 [00:00<03:57, 11.51it/s]  0%|          | 4/2736 [00:00<03:49, 11.89it/s]  0%|          | 6/2736 [00:00<03:47, 12.00it/s]  0%|          | 8/2736 [00:00<03:46, 12.05it/s]  0%|          | 10/2736 [00:00<03:43, 12.21it/s]  0%|          | 12/2736 [00:00<03:43, 12.19it/s]  1%|          | 14/2736 [00:01<03:43, 12.16it/s]  1%|          | 16/2736 [00:01<03:43, 12.19it/s]  1%|          | 18/2736 [00:01<03:41, 12.25it/s]  1%|          | 20/2736 [00:01<03:42, 12.21it/s]  1%|          | 22/2736 [00:01<03:43, 12.16it/s]  1%|          | 24/2736 [00:01<03:43, 12.16it/s]  1%|          | 26/2736 [00:02<03:41, 12.26it/s]  1%|          | 28/2736 [00:02<03:41, 12.24it/s]  1%|          | 30/2736 [00:02<03:41, 12.21it/s]  1%|          | 32/2736 [00:02<03:41, 12.20it/s]  1%|          | 34/2736 [00:02<03:40, 12.28it/s]  1%|▏         | 36/2736 [00:02<03:39, 12.30it/s]  1%|▏         | 38/2736 [00:03<03:38, 12.35it/s]  1%|▏         | 40/2736 [00:03<03:39, 12.31it/s]  2%|▏         | 42/2736 [00:03<03:39, 12.25it/s]  2%|▏         | 44/2736 [00:03<03:37, 12.37it/s]  2%|▏         | 46/2736 [00:03<03:37, 12.38it/s]  2%|▏         | 48/2736 [00:03<03:36, 12.42it/s]  2%|▏         | 50/2736 [00:04<03:35, 12.47it/s]  2%|▏         | 52/2736 [00:04<03:36, 12.40it/s]  2%|▏         | 54/2736 [00:04<03:35, 12.45it/s]  2%|▏         | 56/2736 [00:04<03:36, 12.39it/s]  2%|▏         | 58/2736 [00:04<03:35, 12.44it/s]  2%|▏         | 60/2736 [00:04<03:36, 12.38it/s]  2%|▏         | 62/2736 [00:05<03:36, 12.36it/s]  2%|▏         | 64/2736 [00:05<03:35, 12.38it/s]  2%|▏         | 66/2736 [00:05<03:36, 12.32it/s]  2%|▏         | 68/2736 [00:05<03:37, 12.25it/s]  3%|▎         | 70/2736 [00:05<03:35, 12.35it/s]  3%|▎         | 72/2736 [00:05<03:35, 12.36it/s]  3%|▎         | 74/2736 [00:06<03:34, 12.40it/s]  3%|▎         | 76/2736 [00:06<03:36, 12.27it/s]  3%|▎         | 78/2736 [00:06<03:37, 12.24it/s]  3%|▎     
    | 80/2736 [00:06<03:36, 12.28it/s]  3%|▎         | 82/2736 [00:06<03:35, 12.30it/s]  3%|▎         | 84/2736 [00:06<03:37, 12.22it/s]  3%|▎         | 86/2736 [00:07<03:36, 12.25it/s]  3%|▎         | 88/2736 [00:07<03:34, 12.34it/s]  3%|▎         | 90/2736 [00:07<03:35, 12.28it/s]  3%|▎         | 92/2736 [00:07<03:34, 12.33it/s]  3%|▎         | 94/2736 [00:07<03:34, 12.32it/s]  4%|▎         | 96/2736 [00:07<03:34, 12.29it/s]  4%|▎         | 98/2736 [00:07<03:35, 12.27it/s]  4%|▎         | 100/2736 [00:08<03:33, 12.36it/s]  4%|▎         | 102/2736 [00:08<03:33, 12.32it/s]  4%|▍         | 104/2736 [00:08<03:32, 12.40it/s]  4%|▍         | 106/2736 [00:08<03:33, 12.32it/s]  4%|▍         | 108/2736 [00:08<03:34, 12.25it/s]  4%|▍         | 110/2736 [00:08<03:35, 12.20it/s]  4%|▍         | 112/2736 [00:09<03:32, 12.36it/s]  4%|▍         | 114/2736 [00:09<03:33, 12.28it/s]  4%|▍         | 116/2736 [00:09<03:33, 12.26it/s]  4%|▍         | 118/2736 [00:09<03:32, 12.33it/s]  4%|▍         | 120/2736 [00:09<03:32, 12.30it/s]  4%|▍         | 122/2736 [00:09<03:31, 12.36it/s]  5%|▍         | 124/2736 [00:10<03:31, 12.33it/s]  5%|▍         | 126/2736 [00:10<03:32, 12.28it/s]  5%|▍         | 128/2736 [00:10<03:31, 12.33it/s]  5%|▍         | 130/2736 [00:10<03:30, 12.36it/s]  5%|▍         | 132/2736 [00:10<03:29, 12.41it/s]  5%|▍         | 134/2736 [00:10<03:30, 12.35it/s]  5%|▍         | 136/2736 [00:11<03:29, 12.41it/s]  5%|▌         | 138/2736 [00:11<03:30, 12.34it/s]  5%|▌         | 140/2736 [00:11<03:28, 12.45it/s]  5%|▌         | 142/2736 [00:11<03:29, 12.38it/s]  5%|▌         | 144/2736 [00:11<03:28, 12.44it/s]  5%|▌         | 146/2736 [00:11<03:29, 12.37it/s]  5%|▌         | 148/2736 [00:12<03:27, 12.45it/s]  5%|▌         | 150/2736 [00:12<03:28, 12.39it/s]  6%|▌         | 152/2736 [00:12<03:29, 12.33it/s]  6%|▌         | 154/2736 [00:12<03:30, 12.25it/s]  6%|▌         | 156/2736 [00:12<03:31, 12.21it/s]  6%|▌         | 158/2736 
[00:12<03:29, 12.32it/s]  6%|▌         | 160/2736 [00:13<03:29, 12.31it/s]  6%|▌         | 162/2736 [00:13<03:27, 12.42it/s]  6%|▌         | 164/2736 [00:13<03:28, 12.34it/s]  6%|▌         | 166/2736 [00:13<03:27, 12.40it/s]  6%|▌         | 168/2736 [00:13<03:27, 12.38it/s]  6%|▌         | 170/2736 [00:13<03:28, 12.34it/s]  6%|▋         | 172/2736 [00:13<03:26, 12.41it/s]  6%|▋         | 174/2736 [00:14<03:27, 12.34it/s]  6%|▋         | 176/2736 [00:14<03:29, 12.24it/s]  7%|▋         | 178/2736 [00:14<03:29, 12.21it/s]  7%|▋         | 180/2736 [00:14<03:28, 12.25it/s]  7%|▋         | 182/2736 [00:14<03:27, 12.33it/s]  7%|▋         | 184/2736 [00:14<03:27, 12.27it/s]  7%|▋         | 186/2736 [00:15<03:26, 12.35it/s]  7%|▋         | 188/2736 [00:15<03:27, 12.28it/s]  7%|▋         | 190/2736 [00:15<03:27, 12.26it/s]  7%|▋         | 192/2736 [00:15<03:27, 12.24it/s]  7%|▋         | 194/2736 [00:15<03:25, 12.35it/s]  7%|▋         | 196/2736 [00:15<03:24, 12.40it/s]  7%|▋         | 198/2736 [00:16<03:25, 12.38it/s]  7%|▋         | 200/2736 [00:16<03:23, 12.45it/s]  7%|▋         | 202/2736 [00:16<03:24, 12.37it/s]  7%|▋         | 204/2736 [00:16<03:25, 12.30it/s]  8%|▊         | 206/2736 [00:16<03:24, 12.38it/s]  8%|▊         | 208/2736 [00:16<03:24, 12.34it/s]  8%|▊         | 210/2736 [00:17<03:23, 12.42it/s]  8%|▊         | 212/2736 [00:17<03:24, 12.35it/s]  8%|▊         | 214/2736 [00:17<03:23, 12.37it/s]  8%|▊         | 216/2736 [00:17<03:24, 12.35it/s]  8%|▊         | 218/2736 [00:17<03:24, 12.29it/s]  8%|▊         | 220/2736 [00:17<03:22, 12.41it/s]  8%|▊         | 222/2736 [00:18<03:23, 12.33it/s]  8%|▊         | 224/2736 [00:18<03:22, 12.41it/s]  8%|▊         | 226/2736 [00:18<03:23, 12.35it/s]  8%|▊         | 228/2736 [00:18<03:24, 12.29it/s]  8%|▊         | 230/2736 [00:18<03:21, 12.41it/s]  8%|▊         | 232/2736 [00:18<03:23, 12.33it/s]  9%|▊         | 234/2736 [00:19<03:22, 12.34it/s]  9%|▊         | 236/2736 
[00:19<03:21, 12.39it/s]  9%|▊         | 238/2736 [00:19<03:22, 12.33it/s]  9%|▉         | 240/2736 [00:19<03:21, 12.36it/s]  9%|▉         | 242/2736 [00:19<03:22, 12.35it/s]  9%|▉         | 244/2736 [00:19<03:22, 12.33it/s]  9%|▉         | 246/2736 [00:19<03:21, 12.36it/s]  9%|▉         | 248/2736 [00:20<03:22, 12.28it/s]  9%|▉         | 250/2736 [00:20<03:20, 12.38it/s]  9%|▉         | 252/2736 [00:20<03:21, 12.32it/s]  9%|▉         | 254/2736 [00:20<03:21, 12.31it/s]  9%|▉         | 256/2736 [00:20<03:20, 12.36it/s]  9%|▉         | 258/2736 [00:20<03:21, 12.32it/s] 10%|▉         | 260/2736 [00:21<03:19, 12.39it/s] 10%|▉         | 262/2736 [00:21<03:20, 12.33it/s] 10%|▉         | 264/2736 [00:21<03:19, 12.39it/s] 10%|▉         | 266/2736 [00:21<03:20, 12.32it/s] 10%|▉         | 268/2736 [00:21<03:18, 12.46it/s] 10%|▉         | 270/2736 [00:21<03:19, 12.37it/s] 10%|▉         | 272/2736 [00:22<03:20, 12.29it/s] 10%|█         | 274/2736 [00:22<03:19, 12.36it/s] 10%|█         | 276/2736 [00:22<03:20, 12.30it/s] 10%|█         | 278/2736 [00:22<03:18, 12.40it/s] 10%|█         | 280/2736 [00:22<03:19, 12.33it/s] 10%|█         | 282/2736 [00:22<03:18, 12.34it/s] 10%|█         | 284/2736 [00:23<03:18, 12.38it/s] 10%|█         | 286/2736 [00:23<03:18, 12.32it/s] 11%|█         | 288/2736 [00:23<03:17, 12.40it/s] 11%|█         | 290/2736 [00:23<03:16, 12.43it/s] 11%|█         | 292/2736 [00:23<03:16, 12.46it/s] 11%|█         | 294/2736 [00:23<03:15, 12.48it/s] 11%|█         | 296/2736 [00:24<03:16, 12.45it/s] 11%|█         | 298/2736 [00:24<03:15, 12.46it/s] 11%|█         | 300/2736 [00:24<03:15, 12.45it/s] 11%|█         | 302/2736 [00:24<03:14, 12.52it/s] 11%|█         | 304/2736 [00:24<03:16, 12.39it/s] 11%|█         | 306/2736 [00:24<03:16, 12.35it/s] 11%|█▏        | 308/2736 [00:24<03:16, 12.37it/s] 11%|█▏        | 310/2736 [00:25<03:15, 12.40it/s] 11%|█▏        | 312/2736 [00:25<03:15, 12.40it/s] 11%|█▏        | 314/2736 
[00:25<03:15, 12.39it/s] 12%|█▏        | 316/2736 [00:25<03:14, 12.43it/s] 12%|█▏        | 318/2736 [00:25<03:14, 12.43it/s] 12%|█▏        | 320/2736 [00:25<03:14, 12.43it/s] 12%|█▏        | 322/2736 [00:26<03:15, 12.35it/s] 12%|█▏        | 324/2736 [00:26<03:13, 12.44it/s] 12%|█▏        | 326/2736 [00:26<03:15, 12.35it/s] 12%|█▏        | 328/2736 [00:26<03:15, 12.30it/s] 12%|█▏        | 330/2736 [00:26<03:14, 12.40it/s] 12%|█▏        | 332/2736 [00:26<03:14, 12.34it/s] 12%|█▏        | 334/2736 [00:27<03:13, 12.44it/s] 12%|█▏        | 336/2736 [00:27<03:14, 12.36it/s] 12%|█▏        | 338/2736 [00:27<03:12, 12.43it/s] 12%|█▏        | 340/2736 [00:27<03:13, 12.37it/s] 12%|█▎        | 342/2736 [00:27<03:13, 12.40it/s] 13%|█▎        | 344/2736 [00:27<03:13, 12.35it/s] 13%|█▎        | 346/2736 [00:28<03:14, 12.29it/s] 13%|█▎        | 348/2736 [00:28<03:14, 12.30it/s] 13%|█▎        | 350/2736 [00:28<03:12, 12.37it/s] 13%|█▎        | 352/2736 [00:28<03:13, 12.30it/s] 13%|█▎        | 354/2736 [00:28<03:11, 12.42it/s] 13%|█▎        | 356/2736 [00:28<03:13, 12.32it/s] 13%|█▎        | 358/2736 [00:29<03:11, 12.39it/s] 13%|█▎        | 360/2736 [00:29<03:12, 12.33it/s] 13%|█▎        | 362/2736 [00:29<03:12, 12.34it/s] 13%|█▎        | 364/2736 [00:29<03:11, 12.37it/s] 13%|█▎        | 366/2736 [00:29<03:12, 12.31it/s] 13%|█▎        | 368/2736 [00:29<03:10, 12.41it/s] 14%|█▎        | 370/2736 [00:29<03:12, 12.31it/s] 14%|█▎        | 372/2736 [00:30<03:12, 12.31it/s] 14%|█▎        | 374/2736 [00:30<03:10, 12.38it/s] 14%|█▎        | 376/2736 [00:30<03:11, 12.32it/s] 14%|█▍        | 378/2736 [00:30<03:10, 12.41it/s] 14%|█▍        | 380/2736 [00:30<03:11, 12.33it/s] 14%|█▍        | 382/2736 [00:30<03:12, 12.25it/s] 14%|█▍        | 384/2736 [00:31<03:11, 12.27it/s] 14%|█▍        | 386/2736 [00:31<03:10, 12.33it/s] 14%|█▍        | 388/2736 [00:31<03:11, 12.28it/s] 14%|█▍        | 390/2736 [00:31<03:11, 12.25it/s] 14%|█▍        | 392/2736 
[00:31<03:10, 12.28it/s] 14%|█▍        | 394/2736 [00:31<03:09, 12.33it/s] 14%|█▍        | 396/2736 [00:32<03:10, 12.26it/s] 15%|█▍        | 398/2736 [00:32<03:10, 12.29it/s] 15%|█▍        | 400/2736 [00:32<03:09, 12.34it/s] 15%|█▍        | 402/2736 [00:32<03:09, 12.29it/s] 15%|█▍        | 404/2736 [00:32<03:08, 12.39it/s] 15%|█▍        | 406/2736 [00:32<03:09, 12.31it/s] 15%|█▍        | 408/2736 [00:33<03:07, 12.41it/s] 15%|█▍        | 410/2736 [00:33<03:08, 12.36it/s] 15%|█▌        | 412/2736 [00:33<03:06, 12.44it/s] 15%|█▌        | 414/2736 [00:33<03:07, 12.37it/s] 15%|█▌        | 416/2736 [00:33<03:08, 12.31it/s] 15%|█▌        | 418/2736 [00:33<03:06, 12.42it/s] 15%|█▌        | 420/2736 [00:34<03:07, 12.37it/s] 15%|█▌        | 422/2736 [00:34<03:07, 12.32it/s] 15%|█▌        | 424/2736 [00:34<03:06, 12.39it/s] 16%|█▌        | 426/2736 [00:34<03:07, 12.35it/s] 16%|█▌        | 428/2736 [00:34<03:06, 12.40it/s] 16%|█▌        | 430/2736 [00:34<03:06, 12.37it/s] 16%|█▌        | 432/2736 [00:35<03:05, 12.39it/s] 16%|█▌        | 434/2736 [00:35<03:05, 12.39it/s] 16%|█▌        | 436/2736 [00:35<03:06, 12.34it/s] 16%|█▌        | 438/2736 [00:35<03:05, 12.41it/s] 16%|█▌        | 440/2736 [00:35<03:05, 12.35it/s] 16%|█▌        | 442/2736 [00:35<03:07, 12.25it/s] 16%|█▌        | 444/2736 [00:35<03:06, 12.28it/s] 16%|█▋        | 446/2736 [00:36<03:05, 12.35it/s] 16%|█▋        | 448/2736 [00:36<03:04, 12.40it/s] 16%|█▋        | 450/2736 [00:36<03:04, 12.36it/s] 17%|█▋        | 452/2736 [00:36<03:05, 12.30it/s] 17%|█▋        | 454/2736 [00:36<03:06, 12.25it/s] 17%|█▋        | 456/2736 [00:36<03:04, 12.37it/s] 17%|█▋        | 458/2736 [00:37<03:05, 12.31it/s] 17%|█▋        | 460/2736 [00:37<03:03, 12.37it/s] 17%|█▋        | 462/2736 [00:37<03:05, 12.29it/s] 17%|█▋        | 464/2736 [00:37<03:05, 12.23it/s] 17%|█▋        | 466/2736 [00:37<03:05, 12.22it/s] 17%|█▋        | 468/2736 [00:37<03:05, 12.20it/s] 17%|█▋        | 470/2736 
[00:38<03:03, 12.33it/s] 17%|█▋        | 472/2736 [00:38<03:03, 12.31it/s] 17%|█▋        | 474/2736 [00:38<03:03, 12.34it/s] 17%|█▋        | 476/2736 [00:38<03:03, 12.34it/s] 17%|█▋        | 478/2736 [00:38<03:02, 12.36it/s] 18%|█▊        | 480/2736 [00:38<03:01, 12.43it/s] 18%|█▊        | 482/2736 [00:39<03:02, 12.37it/s] 18%|█▊        | 484/2736 [00:39<03:02, 12.31it/s] 18%|█▊        | 486/2736 [00:39<03:02, 12.32it/s] 18%|█▊        | 488/2736 [00:39<03:01, 12.35it/s] 18%|█▊        | 490/2736 [00:39<03:02, 12.30it/s] 18%|█▊        | 492/2736 [00:39<03:01, 12.39it/s] 18%|█▊        | 494/2736 [00:40<03:01, 12.34it/s] 18%|█▊        | 496/2736 [00:40<03:02, 12.29it/s] 18%|█▊        | 498/2736 [00:40<03:02, 12.25it/s] 18%|█▊        | 500/2736 [00:40<03:01, 12.29it/s] 18%|█▊        | 502/2736 [00:40<03:00, 12.35it/s] 18%|█▊        | 504/2736 [00:40<03:01, 12.30it/s] 18%|█▊        | 506/2736 [00:41<03:00, 12.37it/s] 19%|█▊        | 508/2736 [00:41<03:02, 12.24it/s] 19%|█▊        | 510/2736 [00:41<03:00, 12.35it/s] 19%|█▊        | 512/2736 [00:41<03:01, 12.28it/s] 19%|█▉        | 514/2736 [00:41<03:01, 12.27it/s] 19%|█▉        | 516/2736 [00:41<02:59, 12.34it/s] 19%|█▉        | 518/2736 [00:41<02:59, 12.34it/s] 19%|█▉        | 520/2736 [00:42<02:58, 12.41it/s] 19%|█▉        | 522/2736 [00:42<02:59, 12.37it/s] 19%|█▉        | 524/2736 [00:42<02:57, 12.48it/s] 19%|█▉        | 526/2736 [00:42<02:56, 12.50it/s] 19%|█▉        | 528/2736 [00:42<02:57, 12.44it/s] 19%|█▉        | 530/2736 [00:42<02:56, 12.53it/s] 19%|█▉        | 532/2736 [00:43<02:55, 12.56it/s] 20%|█▉        | 534/2736 [00:43<02:56, 12.45it/s] 20%|█▉        | 536/2736 [00:43<02:56, 12.46it/s] 20%|█▉        | 538/2736 [00:43<02:57, 12.39it/s] 20%|█▉        | 540/2736 [00:43<02:56, 12.43it/s] 20%|█▉        | 542/2736 [00:43<02:57, 12.38it/s] 20%|█▉        | 544/2736 [00:44<02:57, 12.36it/s] 20%|█▉        | 546/2736 [00:44<02:56, 12.39it/s] 20%|██        | 548/2736 
[00:44<02:56, 12.39it/s] 20%|██        | 550/2736 [00:44<02:56, 12.39it/s] 20%|██        | 552/2736 [00:44<02:57, 12.33it/s] 20%|██        | 554/2736 [00:44<02:57, 12.27it/s] 20%|██        | 556/2736 [00:45<02:55, 12.40it/s] 20%|██        | 558/2736 [00:45<02:55, 12.39it/s] 20%|██        | 560/2736 [00:45<02:55, 12.43it/s] 21%|██        | 562/2736 [00:45<02:55, 12.39it/s] 21%|██        | 564/2736 [00:45<02:54, 12.44it/s] 21%|██        | 566/2736 [00:45<02:55, 12.40it/s] 21%|██        | 568/2736 [00:46<02:54, 12.45it/s] 21%|██        | 570/2736 [00:46<02:55, 12.35it/s] 21%|██        | 572/2736 [00:46<02:53, 12.44it/s] 21%|██        | 574/2736 [00:46<02:54, 12.37it/s] 21%|██        | 576/2736 [00:46<02:53, 12.45it/s] 21%|██        | 578/2736 [00:46<02:54, 12.40it/s] 21%|██        | 580/2736 [00:46<02:54, 12.34it/s] 21%|██▏       | 582/2736 [00:47<02:53, 12.43it/s] 21%|██▏       | 584/2736 [00:47<02:54, 12.35it/s] 21%|██▏       | 586/2736 [00:47<02:53, 12.40it/s] 21%|██▏       | 588/2736 [00:47<02:54, 12.32it/s] 22%|██▏       | 590/2736 [00:47<02:55, 12.26it/s] 22%|██▏       | 592/2736 [00:47<02:53, 12.38it/s] 22%|██▏       | 594/2736 [00:48<02:53, 12.32it/s] 22%|██▏       | 596/2736 [00:48<02:54, 12.27it/s] 22%|██▏       | 598/2736 [00:48<02:52, 12.39it/s] 22%|██▏       | 600/2736 [00:48<02:53, 12.32it/s] 22%|██▏       | 602/2736 [00:48<02:52, 12.35it/s] 22%|██▏       | 604/2736 [00:48<02:52, 12.39it/s] 22%|██▏       | 606/2736 [00:49<02:51, 12.41it/s] 22%|██▏       | 608/2736 [00:49<02:51, 12.42it/s] 22%|██▏       | 610/2736 [00:49<02:50, 12.46it/s] 22%|██▏       | 612/2736 [00:49<02:50, 12.42it/s] 22%|██▏       | 614/2736 [00:49<02:50, 12.44it/s] 23%|██▎       | 616/2736 [00:49<02:51, 12.35it/s] 23%|██▎       | 618/2736 [00:50<02:50, 12.44it/s] 23%|██▎       | 620/2736 [00:50<02:51, 12.36it/s] 23%|██▎       | 622/2736 [00:50<02:49, 12.46it/s] 23%|██▎       | 624/2736 [00:50<02:50, 12.37it/s] 23%|██▎       | 626/2736 
[00:50<02:51, 12.33it/s] 23%|██▎       | 628/2736 [00:50<02:49, 12.41it/s] 23%|██▎       | 630/2736 [00:51<02:50, 12.34it/s] 23%|██▎       | 632/2736 [00:51<02:50, 12.34it/s] 23%|██▎       | 634/2736 [00:51<02:49, 12.39it/s] 23%|██▎       | 636/2736 [00:51<02:49, 12.36it/s] 23%|██▎       | 638/2736 [00:51<02:48, 12.42it/s] 23%|██▎       | 640/2736 [00:51<02:49, 12.34it/s] 23%|██▎       | 642/2736 [00:51<02:48, 12.45it/s] 24%|██▎       | 644/2736 [00:52<02:49, 12.37it/s] 24%|██▎       | 646/2736 [00:52<02:47, 12.49it/s] 24%|██▎       | 648/2736 [00:52<02:48, 12.39it/s] 24%|██▍       | 650/2736 [00:52<02:47, 12.45it/s] 24%|██▍       | 652/2736 [00:52<02:48, 12.36it/s] 24%|██▍       | 654/2736 [00:52<02:49, 12.31it/s] 24%|██▍       | 656/2736 [00:53<02:47, 12.40it/s] 24%|██▍       | 658/2736 [00:53<02:47, 12.38it/s] 24%|██▍       | 660/2736 [00:53<02:47, 12.43it/s] 24%|██▍       | 662/2736 [00:53<02:48, 12.34it/s] 24%|██▍       | 664/2736 [00:53<02:46, 12.42it/s] 24%|██▍       | 666/2736 [00:53<02:47, 12.32it/s] 24%|██▍       | 668/2736 [00:54<02:47, 12.33it/s] 24%|██▍       | 670/2736 [00:54<02:47, 12.37it/s] 25%|██▍       | 672/2736 [00:54<02:47, 12.31it/s] 25%|██▍       | 674/2736 [00:54<02:47, 12.32it/s] 25%|██▍       | 676/2736 [00:54<02:46, 12.36it/s] 25%|██▍       | 678/2736 [00:54<02:45, 12.44it/s] 25%|██▍       | 680/2736 [00:55<02:46, 12.37it/s] 25%|██▍       | 682/2736 [00:55<02:46, 12.36it/s] 25%|██▌       | 684/2736 [00:55<02:45, 12.38it/s] 25%|██▌       | 686/2736 [00:55<02:45, 12.37it/s] 25%|██▌       | 688/2736 [00:55<02:45, 12.39it/s] 25%|██▌       | 690/2736 [00:55<02:45, 12.33it/s] 25%|██▌       | 692/2736 [00:56<02:45, 12.37it/s] 25%|██▌       | 694/2736 [00:56<02:45, 12.35it/s] 25%|██▌       | 696/2736 [00:56<02:42, 12.53it/s] 26%|██▌       | 698/2736 [00:56<02:33, 13.32it/s] 26%|██▌       | 700/2736 [00:56<02:37, 12.95it/s] 26%|██▌       | 702/2736 [00:56<02:38, 12.87it/s] 26%|██▌       | 704/2736 
[00:56<02:40, 12.65it/s] 26%|██▌       | 706/2736 [00:57<02:40, 12.62it/s] 26%|██▌       | 708/2736 [00:57<02:42, 12.47it/s] 26%|██▌       | 710/2736 [00:57<02:41, 12.53it/s] 26%|██▌       | 712/2736 [00:57<02:42, 12.43it/s] 26%|██▌       | 714/2736 [00:57<02:42, 12.41it/s] 26%|██▌       | 716/2736 [00:57<02:42, 12.43it/s] 26%|██▌       | 718/2736 [00:58<02:43, 12.34it/s] 26%|██▋       | 720/2736 [00:58<02:43, 12.29it/s] 26%|██▋       | 722/2736 [00:58<02:42, 12.37it/s] 26%|██▋       | 724/2736 [00:58<02:43, 12.31it/s] 27%|██▋       | 726/2736 [00:58<02:42, 12.35it/s] 27%|██▋       | 728/2736 [00:58<02:42, 12.39it/s] 27%|██▋       | 730/2736 [00:59<02:42, 12.32it/s] 27%|██▋       | 732/2736 [00:59<02:43, 12.26it/s] 27%|██▋       | 734/2736 [00:59<02:41, 12.37it/s] 27%|██▋       | 736/2736 [00:59<02:42, 12.33it/s] 27%|██▋       | 738/2736 [00:59<02:42, 12.28it/s] 27%|██▋       | 740/2736 [00:59<02:43, 12.24it/s] 27%|██▋       | 742/2736 [01:00<02:41, 12.33it/s] 27%|██▋       | 744/2736 [01:00<02:41, 12.31it/s] 27%|██▋       | 746/2736 [01:00<02:40, 12.43it/s] 27%|██▋       | 748/2736 [01:00<02:41, 12.33it/s] 27%|██▋       | 750/2736 [01:00<02:37, 12.58it/s] 27%|██▋       | 752/2736 [01:00<02:29, 13.26it/s] 28%|██▊       | 754/2736 [01:00<02:30, 13.16it/s] 28%|██▊       | 756/2736 [01:01<02:34, 12.84it/s] 28%|██▊       | 758/2736 [01:01<02:34, 12.81it/s] 28%|██▊       | 760/2736 [01:01<02:36, 12.66it/s] 28%|██▊       | 762/2736 [01:01<02:36, 12.65it/s] 28%|██▊       | 764/2736 [01:01<02:36, 12.60it/s] 28%|██▊       | 766/2736 [01:01<02:36, 12.58it/s] 28%|██▊       | 768/2736 [01:02<02:36, 12.54it/s] 28%|██▊       | 770/2736 [01:02<02:36, 12.52it/s] 28%|██▊       | 772/2736 [01:02<02:36, 12.56it/s] 28%|██▊       | 774/2736 [01:02<02:36, 12.53it/s] 28%|██▊       | 776/2736 [01:02<02:36, 12.51it/s] 28%|██▊       | 778/2736 [01:02<02:36, 12.52it/s] 29%|██▊       | 780/2736 [01:03<02:36, 12.46it/s] 29%|██▊       | 782/2736 
[01:03<02:36, 12.47it/s] 29%|██▊       | 784/2736 [01:03<02:36, 12.46it/s] 29%|██▊       | 786/2736 [01:03<02:36, 12.44it/s] 29%|██▉       | 788/2736 [01:03<02:36, 12.45it/s] 29%|██▉       | 790/2736 [01:03<02:35, 12.53it/s] 29%|██▉       | 792/2736 [01:04<02:36, 12.42it/s] 29%|██▉       | 794/2736 [01:04<02:35, 12.47it/s] 29%|██▉       | 796/2736 [01:04<02:36, 12.39it/s] 29%|██▉       | 798/2736 [01:04<02:36, 12.39it/s] 29%|██▉       | 800/2736 [01:04<02:36, 12.38it/s] 29%|██▉       | 802/2736 [01:04<02:36, 12.32it/s] 29%|██▉       | 804/2736 [01:05<02:36, 12.32it/s] 29%|██▉       | 806/2736 [01:05<02:27, 13.04it/s] 30%|██▉       | 808/2736 [01:05<02:25, 13.24it/s] 30%|██▉       | 810/2736 [01:05<02:29, 12.89it/s] 30%|██▉       | 812/2736 [01:05<02:31, 12.71it/s] 30%|██▉       | 814/2736 [01:05<02:31, 12.66it/s] 30%|██▉       | 816/2736 [01:05<02:33, 12.50it/s] 30%|██▉       | 818/2736 [01:06<02:34, 12.40it/s] 30%|██▉       | 820/2736 [01:06<02:33, 12.47it/s] 30%|███       | 822/2736 [01:06<02:34, 12.38it/s] 30%|███       | 824/2736 [01:06<02:34, 12.38it/s] 30%|███       | 826/2736 [01:06<02:33, 12.42it/s] 30%|███       | 828/2736 [01:06<02:33, 12.46it/s] 30%|███       | 830/2736 [01:07<02:34, 12.37it/s] 30%|███       | 832/2736 [01:07<02:33, 12.38it/s] 30%|███       | 834/2736 [01:07<02:33, 12.40it/s] 31%|███       | 836/2736 [01:07<02:33, 12.38it/s] 31%|███       | 838/2736 [01:07<02:33, 12.37it/s] 31%|███       | 840/2736 [01:07<02:33, 12.33it/s] 31%|███       | 842/2736 [01:08<02:34, 12.24it/s] 31%|███       | 844/2736 [01:08<02:34, 12.21it/s] 31%|███       | 846/2736 [01:08<02:33, 12.31it/s] 31%|███       | 848/2736 [01:08<02:33, 12.27it/s] 31%|███       | 850/2736 [01:08<02:34, 12.24it/s] 31%|███       | 852/2736 [01:08<02:32, 12.35it/s] 31%|███       | 854/2736 [01:09<02:33, 12.29it/s] 31%|███▏      | 856/2736 [01:09<02:33, 12.27it/s] 31%|███▏      | 858/2736 [01:09<02:33, 12.22it/s] 31%|███▏      | 860/2736 
[01:09<02:24, 12.96it/s] 32%|███▏      | 862/2736 [01:09<02:21, 13.28it/s] 32%|███▏      | 864/2736 [01:09<02:24, 12.99it/s] 32%|███▏      | 866/2736 [01:09<02:27, 12.72it/s] 32%|███▏      | 868/2736 [01:10<02:27, 12.63it/s] 32%|███▏      | 870/2736 [01:10<02:28, 12.58it/s] 32%|███▏      | 872/2736 [01:10<02:29, 12.43it/s] 32%|███▏      | 874/2736 [01:10<02:29, 12.48it/s] 32%|███▏      | 876/2736 [01:10<02:30, 12.36it/s] 32%|███▏      | 878/2736 [01:10<02:29, 12.42it/s] 32%|███▏      | 880/2736 [01:11<02:30, 12.34it/s] 32%|███▏      | 882/2736 [01:11<02:31, 12.26it/s] 32%|███▏      | 884/2736 [01:11<02:29, 12.37it/s] 32%|███▏      | 886/2736 [01:11<02:30, 12.31it/s] 32%|███▏      | 888/2736 [01:11<02:30, 12.27it/s] 33%|███▎      | 890/2736 [01:11<02:30, 12.23it/s] 33%|███▎      | 892/2736 [01:12<02:30, 12.21it/s] 33%|███▎      | 894/2736 [01:12<02:29, 12.35it/s] 33%|███▎      | 896/2736 [01:12<02:29, 12.31it/s] 33%|███▎      | 898/2736 [01:12<02:28, 12.36it/s] 33%|███▎      | 900/2736 [01:12<02:28, 12.35it/s] 33%|███▎      | 902/2736 [01:12<02:29, 12.30it/s] 33%|███▎      | 904/2736 [01:13<02:27, 12.40it/s] 33%|███▎      | 906/2736 [01:13<02:28, 12.32it/s] 33%|███▎      | 908/2736 [01:13<02:27, 12.40it/s] 33%|███▎      | 910/2736 [01:13<02:28, 12.32it/s] 33%|███▎      | 912/2736 [01:13<02:27, 12.36it/s]
-  0%|          | 0/126 [00:00<?, ?it/s][A
-  1%|          | 1/126 [00:01<02:40,  1.29s/it][A
-  2%|▏         | 2/126 [00:02<02:36,  1.26s/it][A
-  2%|▏         | 3/126 [00:03<02:34,  1.26s/it][A
-  3%|▎         | 4/126 [00:05<02:32,  1.25s/it][A
-  4%|▍         | 5/126 [00:06<02:30,  1.24s/it][A
-  5%|▍         | 6/126 [00:07<02:28,  1.24s/it][A
-  6%|▌         | 7/126 [00:08<02:27,  1.24s/it][A
-  6%|▋         | 8/126 [00:09<02:26,  1.24s/it][A
-  7%|▋         | 9/126 [00:11<02:24,  1.24s/it][A
-  8%|▊         | 10/126 [00:12<02:23,  1.24s/it][A
-  9%|▊         | 11/126 [00:13<02:22,  1.24s/it][A 33%|███▎      | 912/2736 [01:27<02:27, 12.36it/s]
- 10%|▉         | 12/126 [00:14<02:20,  1.24s/it][A
- 10%|█         | 13/126 [00:16<02:19,  1.24s/it][A
- 11%|█         | 14/126 [00:17<02:18,  1.23s/it][A
- 12%|█▏        | 15/126 [00:18<02:17,  1.24s/it][A
- 13%|█▎        | 16/126 [00:19<02:15,  1.24s/it][A
- 13%|█▎        | 17/126 [00:21<02:14,  1.24s/it][A
- 14%|█▍        | 18/126 [00:22<02:13,  1.24s/it][A
- 15%|█▌        | 19/126 [00:23<02:12,  1.24s/it][A
- 16%|█▌        | 20/126 [00:24<02:11,  1.24s/it][A
- 17%|█▋        | 21/126 [00:26<02:09,  1.24s/it][A
- 17%|█▋        | 22/126 [00:27<02:08,  1.24s/it][A
- 18%|█▊        | 23/126 [00:28<02:07,  1.24s/it][A
- 19%|█▉        | 24/126 [00:29<02:06,  1.24s/it][A
- 20%|█▉        | 25/126 [00:30<02:04,  1.24s/it][A
- 21%|██        | 26/126 [00:32<02:03,  1.24s/it][A
- 21%|██▏       | 27/126 [00:33<02:02,  1.24s/it][A
- 22%|██▏       | 28/126 [00:34<02:01,  1.24s/it][A
- 23%|██▎       | 29/126 [00:35<02:00,  1.24s/it][A
- 24%|██▍       | 30/126 [00:37<01:58,  1.24s/it][A
- 25%|██▍       | 31/126 [00:38<01:57,  1.24s/it][A
- 25%|██▌       | 32/126 [00:39<01:56,  1.24s/it][A
- 26%|██▌       | 33/126 [00:40<01:55,  1.24s/it][A
- 27%|██▋       | 34/126 [00:42<01:53,  1.24s/it][A
- 28%|██▊       | 35/126 [00:43<01:52,  1.24s/it][A
- 29%|██▊       | 36/126 [00:44<01:51,  1.24s/it][A
- 29%|██▉       | 37/126 [00:45<01:50,  1.24s/it][A
- 30%|███       | 38/126 [00:47<01:48,  1.24s/it][A
- 31%|███       | 39/126 [00:48<01:47,  1.24s/it][A
- 32%|███▏      | 40/126 [00:49<01:46,  1.24s/it][A
- 33%|███▎      | 41/126 [00:50<01:45,  1.24s/it][A
- 33%|███▎      | 42/126 [00:52<01:44,  1.24s/it][A
- 34%|███▍      | 43/126 [00:53<01:42,  1.24s/it][A
- 35%|███▍      | 44/126 [00:54<01:41,  1.24s/it][A
- 36%|███▌      | 45/126 [00:55<01:40,  1.24s/it][A
- 37%|███▋      | 46/126 [00:56<01:39,  1.24s/it][A
- 37%|███▋      | 47/126 [00:58<01:37,  1.24s/it][A
- 38%|███▊      | 48/126 [00:59<01:36,  1.24s/it][A
- 39%|███▉      | 49/126 [01:00<01:35,  1.24s/it][A
- 40%|███▉      | 50/126 [01:01<01:34,  1.24s/it][A
- 40%|████      | 51/126 [01:03<01:32,  1.24s/it][A
- 41%|████▏     | 52/126 [01:04<01:31,  1.24s/it][A
- 42%|████▏     | 53/126 [01:05<01:30,  1.24s/it][A
- 43%|████▎     | 54/126 [01:06<01:29,  1.24s/it][A
- 44%|████▎     | 55/126 [01:08<01:27,  1.24s/it][A
- 44%|████▍     | 56/126 [01:09<01:26,  1.24s/it][A
- 45%|████▌     | 57/126 [01:10<01:25,  1.24s/it][A
- 46%|████▌     | 58/126 [01:11<01:24,  1.24s/it][A
- 47%|████▋     | 59/126 [01:13<01:22,  1.24s/it][A
- 48%|████▊     | 60/126 [01:14<01:21,  1.24s/it][A
- 48%|████▊     | 61/126 [01:15<01:20,  1.24s/it][A
- 49%|████▉     | 62/126 [01:16<01:19,  1.24s/it][A
- 50%|█████     | 63/126 [01:18<01:17,  1.24s/it][A
- 51%|█████     | 64/126 [01:19<01:16,  1.24s/it][A
- 52%|█████▏    | 65/126 [01:20<01:15,  1.24s/it][A
- 52%|█████▏    | 66/126 [01:21<01:14,  1.24s/it][A
- 53%|█████▎    | 67/126 [01:22<01:13,  1.24s/it][A
- 54%|█████▍    | 68/126 [01:24<01:11,  1.24s/it][A
- 55%|█████▍    | 69/126 [01:25<01:10,  1.24s/it][A
- 56%|█████▌    | 70/126 [01:26<01:08,  1.23s/it][A
- 56%|█████▋    | 71/126 [01:27<01:07,  1.22s/it][A
- 57%|█████▋    | 72/126 [01:29<01:05,  1.21s/it][A
- 58%|█████▊    | 73/126 [01:30<01:04,  1.21s/it][A
- 59%|█████▊    | 74/126 [01:31<01:02,  1.20s/it][A
- 60%|█████▉    | 75/126 [01:32<01:01,  1.20s/it][A
- 60%|██████    | 76/126 [01:33<01:00,  1.20s/it][A
- 61%|██████    | 77/126 [01:35<00:58,  1.20s/it][A
- 62%|██████▏   | 78/126 [01:36<00:57,  1.20s/it][A
- 63%|██████▎   | 79/126 [01:37<00:56,  1.20s/it][A
- 63%|██████▎   | 80/126 [01:38<00:55,  1.20s/it][A
- 64%|██████▍   | 81/126 [01:39<00:53,  1.20s/it][A
- 65%|██████▌   | 82/126 [01:41<00:52,  1.20s/it][A
- 66%|██████▌   | 83/126 [01:42<00:51,  1.20s/it][A
- 67%|██████▋   | 84/126 [01:43<00:50,  1.20s/it][A
- 67%|██████▋   | 85/126 [01:44<00:49,  1.20s/it][A
- 68%|██████▊   | 86/126 [01:45<00:47,  1.20s/it][A
- 69%|██████▉   | 87/126 [01:47<00:46,  1.20s/it][A
- 70%|██████▉   | 88/126 [01:48<00:45,  1.20s/it][A
- 71%|███████   | 89/126 [01:49<00:44,  1.20s/it][A
- 71%|███████▏  | 90/126 [01:50<00:43,  1.20s/it][A
- 72%|███████▏  | 91/126 [01:51<00:41,  1.20s/it][A
- 73%|███████▎  | 92/126 [01:53<00:40,  1.20s/it][A
- 74%|███████▍  | 93/126 [01:54<00:39,  1.20s/it][A
- 75%|███████▍  | 94/126 [01:55<00:38,  1.20s/it][A
- 75%|███████▌  | 95/126 [01:56<00:37,  1.20s/it][A
- 76%|███████▌  | 96/126 [01:57<00:35,  1.20s/it][A
- 77%|███████▋  | 97/126 [01:59<00:34,  1.20s/it][A
- 78%|███████▊  | 98/126 [02:00<00:33,  1.20s/it][A
- 79%|███████▊  | 99/126 [02:01<00:32,  1.20s/it][A
- 79%|███████▉  | 100/126 [02:02<00:31,  1.20s/it][A
- 80%|████████  | 101/126 [02:03<00:29,  1.20s/it][A
- 81%|████████  | 102/126 [02:05<00:28,  1.20s/it][A
- 82%|████████▏ | 103/126 [02:06<00:27,  1.20s/it][A
- 83%|████████▎ | 104/126 [02:07<00:26,  1.20s/it][A
- 83%|████████▎ | 105/126 [02:08<00:25,  1.20s/it][A
- 84%|████████▍ | 106/126 [02:09<00:23,  1.20s/it][A
- 85%|████████▍ | 107/126 [02:11<00:22,  1.20s/it][A
- 86%|████████▌ | 108/126 [02:12<00:21,  1.20s/it][A
- 87%|████████▋ | 109/126 [02:13<00:20,  1.21s/it][A
- 87%|████████▋ | 110/126 [02:14<00:19,  1.22s/it][A
- 88%|████████▊ | 111/126 [02:15<00:18,  1.22s/it][A
- 89%|████████▉ | 112/126 [02:17<00:17,  1.23s/it][A
- 90%|████████▉ | 113/126 [02:18<00:16,  1.23s/it][A
- 90%|█████████ | 114/126 [02:19<00:14,  1.23s/it][A
- 91%|█████████▏| 115/126 [02:20<00:13,  1.24s/it][A
- 92%|█████████▏| 116/126 [02:22<00:12,  1.24s/it][A
- 93%|█████████▎| 117/126 [02:23<00:11,  1.24s/it][A
- 94%|█████████▎| 118/126 [02:24<00:09,  1.24s/it][A
- 94%|█████████▍| 119/126 [02:25<00:08,  1.24s/it][A
- 95%|█████████▌| 120/126 [02:27<00:07,  1.24s/it][A
- 96%|█████████▌| 121/126 [02:28<00:06,  1.24s/it][A
- 97%|█████████▋| 122/126 [02:29<00:04,  1.24s/it][A
- 98%|█████████▊| 123/126 [02:30<00:03,  1.24s/it][A
- 98%|█████████▊| 124/126 [02:32<00:02,  1.24s/it][A 98%|█████████▊| 124/126 [02:32<00:02,  1.23s/it]
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 217, in <module>
-    for batch in tqdm(eval_dataloader):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/tqdm/std.py", line 1178, in __iter__
-    for obj in iterable:
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/accelerate/data_loader.py", line 394, in __iter__
-    next_batch = next(dataloader_iter)
-                 ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 633, in __next__
-    data = self._next_data()
-           ^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 677, in _next_data
-    data = self._dataset_fetcher.fetch(index)  # may raise StopIteration
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/_utils/fetch.py", line 54, in fetch
-    return self.collate_fn(data)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/data/data_collator.py", line 600, in __call__
-    decoder_input_ids = self.model.prepare_decoder_input_ids_from_labels(labels=features["labels"])
-                        ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/marian/modeling_marian.py", line 1527, in prepare_decoder_input_ids_from_labels
-    return shift_tokens_right(labels, self.config.pad_token_id, self.config.decoder_start_token_id)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/marian/modeling_marian.py", line 66, in shift_tokens_right
-    shifted_input_ids[:, 0] = decoder_start_token_id
-    ~~~~~~~~~~~~~~~~~^^^^^^
-IndexError: index 0 is out of bounds for dimension 1 with size 0
- 33%|███▎      | 912/2736 [03:45<07:31,  4.04it/s]
diff --git a/myerrors_1564.out b/myerrors_1564.out
deleted file mode 100644
index 0e1bedd4886c3dc4cf46438aaf215abe70343958..0000000000000000000000000000000000000000
--- a/myerrors_1564.out
+++ /dev/null
@@ -1,161 +0,0 @@
-You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:32,  2.29s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.15s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.59s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.85s/it] 38%|███▊      | 6/16 [00:21<00:40,  4.01s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.12s/it] 50%|█████     | 8/16 [00:30<00:33,  4.18s/it] 56%|█████▋    | 9/16 [00:34<00:29,  4.23s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.26s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.28s/it] 75%|███████▌  | 12/16 [00:47<00:17,  4.29s/it] 81%|████████▏ | 13/16 [00:52<00:12,  4.31s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.31s/it] 94%|█████████▍| 15/16 [01:00<00:04,  4.32s/it]100%|██████████| 16/16 [01:03<00:00,  3.94s/it]100%|██████████| 16/16 [01:04<00:00,  4.02s/it]
-  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:38,  4.31it/s]  0%|          | 3/684 [00:00<01:17,  8.82it/s]  1%|          | 5/684 [00:00<01:02, 10.82it/s]  1%|          | 7/684 [00:00<00:57, 11.88it/s]  1%|▏         | 9/684 [00:00<00:53, 12.54it/s]  2%|▏         | 11/684 [00:00<00:52, 12.94it/s]  2%|▏         | 13/684 [00:01<00:51, 13.15it/s]  2%|▏         | 15/684 [00:01<00:50, 13.32it/s]  2%|▏         | 17/684 [00:01<00:49, 13.49it/s]  3%|▎         | 19/684 [00:01<00:49, 13.57it/s]  3%|▎         | 21/684 [00:01<00:48, 13.58it/s]  3%|▎         | 23/684 [00:01<00:48, 13.64it/s]  4%|▎         | 25/684 [00:01<00:48, 13.71it/s]  4%|▍         | 27/684 [00:02<00:47, 13.74it/s]  4%|▍         | 29/684 [00:02<00:47, 13.69it/s]  5%|▍         | 31/684 [00:02<00:47, 13.78it/s]  5%|▍         | 33/684 [00:02<00:47, 13.80it/s]  5%|▌         | 35/684 [00:02<00:47, 13.76it/s]  5%|▌         | 37/684 [00:02<00:47, 13.76it/s]  6%|▌         | 39/684 [00:02<00:46, 13.73it/s]  6%|▌         | 41/684 [00:03<00:46, 13.74it/s]  6%|▋         | 43/684 [00:03<00:46, 13.71it/s]  7%|▋         | 45/684 [00:03<00:46, 13.77it/s]  7%|▋         | 47/684 [00:03<00:46, 13.68it/s]  7%|▋         | 49/684 [00:03<00:46, 13.77it/s]  7%|▋         | 51/684 [00:03<00:45, 13.79it/s]  8%|▊         | 53/684 [00:04<00:45, 13.81it/s]  8%|▊         | 55/684 [00:04<00:45, 13.78it/s]  8%|▊         | 57/684 [00:04<00:45, 13.77it/s]  9%|▊         | 59/684 [00:04<00:45, 13.73it/s]  9%|▉         | 61/684 [00:04<00:45, 13.72it/s]  9%|▉         | 63/684 [00:04<00:45, 13.74it/s] 10%|▉         | 65/684 [00:04<00:44, 13.76it/s] 10%|▉         | 67/684 [00:05<00:44, 13.77it/s] 10%|█         | 69/684 [00:05<00:44, 13.78it/s] 10%|█         | 71/684 [00:05<00:44, 13.76it/s] 11%|█         | 73/684 [00:05<00:44, 13.76it/s] 11%|█         | 75/684 [00:05<00:44, 13.78it/s] 11%|█▏        | 77/684 [00:05<00:44, 13.76it/s] 12%|█▏        | 79/684 [00:05<00:43, 13.76it/s] 
12%|█▏        | 81/684 [00:06<00:43, 13.77it/s] 12%|█▏        | 83/684 [00:06<00:43, 13.76it/s] 12%|█▏        | 85/684 [00:06<00:43, 13.75it/s] 13%|█▎        | 87/684 [00:06<00:43, 13.79it/s] 13%|█▎        | 89/684 [00:06<00:43, 13.76it/s] 13%|█▎        | 91/684 [00:06<00:43, 13.74it/s] 14%|█▎        | 93/684 [00:06<00:43, 13.74it/s] 14%|█▍        | 95/684 [00:07<00:42, 13.79it/s] 14%|█▍        | 97/684 [00:07<00:42, 13.75it/s] 14%|█▍        | 99/684 [00:07<00:42, 13.77it/s] 15%|█▍        | 101/684 [00:07<00:42, 13.76it/s] 15%|█▌        | 103/684 [00:07<00:42, 13.68it/s] 15%|█▌        | 105/684 [00:07<00:42, 13.78it/s] 16%|█▌        | 107/684 [00:07<00:41, 13.83it/s] 16%|█▌        | 109/684 [00:08<00:41, 13.74it/s] 16%|█▌        | 111/684 [00:08<00:41, 13.76it/s] 17%|█▋        | 113/684 [00:08<00:41, 13.81it/s] 17%|█▋        | 115/684 [00:08<00:41, 13.81it/s] 17%|█▋        | 117/684 [00:08<00:41, 13.79it/s] 17%|█▋        | 119/684 [00:08<00:41, 13.76it/s] 18%|█▊        | 121/684 [00:08<00:41, 13.73it/s] 18%|█▊        | 123/684 [00:09<00:40, 13.76it/s] 18%|█▊        | 125/684 [00:09<00:40, 13.76it/s] 19%|█▊        | 127/684 [00:09<00:40, 13.70it/s] 19%|█▉        | 129/684 [00:09<00:40, 13.74it/s] 19%|█▉        | 131/684 [00:09<00:40, 13.76it/s] 19%|█▉        | 133/684 [00:09<00:40, 13.70it/s] 20%|█▉        | 135/684 [00:09<00:40, 13.72it/s] 20%|██        | 137/684 [00:10<00:39, 13.74it/s] 20%|██        | 139/684 [00:10<00:39, 13.78it/s] 21%|██        | 141/684 [00:10<00:39, 13.78it/s] 21%|██        | 143/684 [00:10<00:39, 13.81it/s] 21%|██        | 145/684 [00:10<00:39, 13.79it/s] 21%|██▏       | 147/684 [00:10<00:39, 13.76it/s] 22%|██▏       | 149/684 [00:10<00:38, 13.78it/s] 22%|██▏       | 151/684 [00:11<00:38, 13.80it/s] 22%|██▏       | 153/684 [00:11<00:38, 13.79it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.78it/s] 23%|██▎       | 157/684 [00:11<00:38, 13.76it/s] 23%|██▎       | 159/684 [00:11<00:38, 13.74it/s] 24%|██▎   
    | 161/684 [00:11<00:38, 13.72it/s] 24%|██▍       | 163/684 [00:12<00:37, 13.74it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.69it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.69it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.72it/s] 25%|██▌       | 171/684 [00:12<00:37, 13.76it/s] 25%|██▌       | 173/684 [00:12<00:37, 13.74it/s] 26%|██▌       | 175/684 [00:12<00:36, 13.78it/s] 26%|██▌       | 177/684 [00:13<00:36, 13.76it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.76it/s] 26%|██▋       | 181/684 [00:13<00:36, 13.79it/s] 27%|██▋       | 183/684 [00:13<00:36, 13.82it/s] 27%|██▋       | 185/684 [00:13<00:36, 13.80it/s] 27%|██▋       | 187/684 [00:13<00:35, 13.90it/s] 28%|██▊       | 189/684 [00:13<00:35, 14.01it/s] 28%|██▊       | 191/684 [00:14<00:35, 13.91it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.88it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.85it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.77it/s] 29%|██▉       | 199/684 [00:14<00:35, 13.79it/s] 29%|██▉       | 201/684 [00:14<00:35, 13.72it/s] 30%|██▉       | 203/684 [00:14<00:34, 13.76it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.77it/s] 30%|███       | 207/684 [00:15<00:34, 13.76it/s] 31%|███       | 209/684 [00:15<00:34, 13.72it/s] 31%|███       | 211/684 [00:15<00:34, 13.74it/s] 31%|███       | 213/684 [00:15<00:34, 13.74it/s] 31%|███▏      | 215/684 [00:15<00:34, 13.79it/s] 32%|███▏      | 217/684 [00:15<00:33, 13.82it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.80it/s] 32%|███▏      | 221/684 [00:16<00:33, 13.79it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.77it/s] 33%|███▎      | 225/684 [00:16<00:33, 13.75it/s] 33%|███▎      | 227/684 [00:16<00:33, 13.72it/s] 33%|███▎      | 229/684 [00:19<03:06,  2.43it/s] 34%|███▍      | 231/684 [00:19<02:19,  3.24it/s] 34%|███▍      | 233/684 [00:19<01:47,  4.21it/s] 34%|███▍      | 235/684 [00:19<01:24,  5.33it/s] 35%|███▍      | 237/684 [00:19<01:08,  6.50it/s] 35%|███▍      | 239/684 [00:19<00:59,  7.53it/s] 35%|███▌  
    | 241/684 [00:19<00:50,  8.72it/s] 36%|███▌      | 243/684 [00:20<00:46,  9.51it/s] 36%|███▌      | 245/684 [00:20<00:41, 10.56it/s] 36%|███▌      | 247/684 [00:20<00:38, 11.48it/s] 36%|███▋      | 249/684 [00:20<00:37, 11.74it/s] 37%|███▋      | 251/684 [00:20<00:35, 12.10it/s] 37%|███▋      | 253/684 [00:20<00:34, 12.50it/s] 37%|███▋      | 255/684 [00:21<00:34, 12.45it/s] 38%|███▊      | 257/684 [00:21<00:33, 12.84it/s] 38%|███▊      | 259/684 [00:21<00:32, 13.18it/s] 38%|███▊      | 261/684 [00:21<00:32, 12.98it/s] 38%|███▊      | 263/684 [00:21<00:31, 13.16it/s] 39%|███▊      | 265/684 [00:21<00:32, 12.88it/s] 39%|███▉      | 267/684 [00:21<00:32, 12.88it/s] 39%|███▉      | 269/684 [00:22<00:32, 12.92it/s] 40%|███▉      | 271/684 [00:22<00:31, 12.94it/s] 40%|███▉      | 273/684 [00:22<00:31, 13.00it/s] 40%|████      | 275/684 [00:22<00:32, 12.76it/s] 40%|████      | 277/684 [00:22<00:31, 13.11it/s] 41%|████      | 279/684 [00:22<00:31, 12.92it/s] 41%|████      | 281/684 [00:22<00:30, 13.14it/s] 41%|████▏     | 283/684 [00:23<00:29, 13.38it/s] 42%|████▏     | 285/684 [00:23<00:30, 13.18it/s] 42%|████▏     | 287/684 [00:23<00:30, 13.23it/s] 42%|████▏     | 289/684 [00:23<00:30, 13.00it/s] 43%|████▎     | 291/684 [00:23<00:29, 13.19it/s] 43%|████▎     | 293/684 [00:23<00:30, 12.88it/s] 43%|████▎     | 295/684 [00:24<00:29, 13.30it/s] 43%|████▎     | 297/684 [00:24<00:29, 13.08it/s] 44%|████▎     | 299/684 [00:24<00:29, 13.24it/s] 44%|████▍     | 301/684 [00:24<00:29, 13.08it/s] 44%|████▍     | 303/684 [00:24<00:28, 13.17it/s] 45%|████▍     | 305/684 [00:24<00:28, 13.44it/s] 45%|████▍     | 307/684 [00:24<00:28, 13.05it/s] 45%|████▌     | 309/684 [00:25<00:28, 13.09it/s] 45%|████▌     | 311/684 [00:25<00:28, 12.95it/s] 46%|████▌     | 313/684 [00:25<00:27, 13.31it/s] 46%|████▌     | 315/684 [00:25<00:27, 13.53it/s] 46%|████▋     | 317/684 [00:25<00:26, 13.69it/s] 47%|████▋     | 319/684 [00:25<00:27, 13.35it/s] 47%|████▋ 
    | 321/684 [00:26<00:27, 13.34it/s] 47%|████▋     | 323/684 [00:26<00:27, 13.18it/s] 48%|████▊     | 325/684 [00:26<00:27, 13.28it/s] 48%|████▊     | 327/684 [00:26<00:26, 13.39it/s] 48%|████▊     | 329/684 [00:26<00:27, 13.11it/s] 48%|████▊     | 331/684 [00:26<00:26, 13.30it/s] 49%|████▊     | 333/684 [00:26<00:26, 13.49it/s] 49%|████▉     | 335/684 [00:27<00:25, 13.62it/s] 49%|████▉     | 337/684 [00:27<00:25, 13.76it/s] 50%|████▉     | 339/684 [00:27<00:24, 13.83it/s] 50%|████▉     | 341/684 [00:27<00:24, 13.87it/s] 50%|█████     | 343/684 [00:27<00:24, 13.92it/s] 50%|█████     | 345/684 [00:27<00:24, 13.95it/s] 51%|█████     | 347/684 [00:27<00:24, 13.97it/s] 51%|█████     | 349/684 [00:28<00:23, 13.97it/s] 51%|█████▏    | 351/684 [00:28<00:23, 13.99it/s] 52%|█████▏    | 353/684 [00:28<00:23, 13.97it/s] 52%|█████▏    | 355/684 [00:28<00:23, 13.99it/s] 52%|█████▏    | 357/684 [00:28<00:23, 14.00it/s] 52%|█████▏    | 359/684 [00:28<00:23, 13.99it/s] 53%|█████▎    | 361/684 [00:28<00:23, 14.01it/s] 53%|█████▎    | 363/684 [00:29<00:22, 14.04it/s] 53%|█████▎    | 365/684 [00:29<00:22, 14.00it/s] 54%|█████▎    | 367/684 [00:29<00:22, 14.00it/s] 54%|█████▍    | 369/684 [00:29<00:22, 14.03it/s] 54%|█████▍    | 371/684 [00:29<00:22, 14.04it/s] 55%|█████▍    | 373/684 [00:29<00:22, 14.00it/s] 55%|█████▍    | 375/684 [00:29<00:22, 14.04it/s] 55%|█████▌    | 377/684 [00:30<00:21, 14.01it/s] 55%|█████▌    | 379/684 [00:30<00:21, 14.01it/s] 56%|█████▌    | 381/684 [00:30<00:21, 14.03it/s] 56%|█████▌    | 383/684 [00:30<00:21, 14.05it/s] 56%|█████▋    | 385/684 [00:30<00:21, 14.07it/s] 57%|█████▋    | 387/684 [00:30<00:21, 14.05it/s] 57%|█████▋    | 389/684 [00:30<00:21, 14.04it/s] 57%|█████▋    | 391/684 [00:31<00:20, 14.06it/s] 57%|█████▋    | 393/684 [00:31<00:20, 14.04it/s] 58%|█████▊    | 395/684 [00:31<00:20, 14.05it/s] 58%|█████▊    | 397/684 [00:31<00:20, 14.00it/s] 58%|█████▊    | 399/684 [00:31<00:20, 14.03it/s] 
59%|█████▊    | 401/684 [00:31<00:20, 14.04it/s] 59%|█████▉    | 403/684 [00:31<00:20, 14.03it/s] 59%|█████▉    | 405/684 [00:32<00:19, 14.03it/s] 60%|█████▉    | 407/684 [00:32<00:19, 14.02it/s] 60%|█████▉    | 409/684 [00:32<00:19, 14.01it/s] 60%|██████    | 411/684 [00:32<00:19, 14.01it/s] 60%|██████    | 413/684 [00:32<00:19, 14.02it/s] 61%|██████    | 415/684 [00:32<00:19, 14.04it/s] 61%|██████    | 417/684 [00:32<00:19, 14.00it/s] 61%|██████▏   | 419/684 [00:33<00:18, 14.02it/s] 62%|██████▏   | 421/684 [00:33<00:18, 14.04it/s] 62%|██████▏   | 423/684 [00:33<00:18, 14.04it/s] 62%|██████▏   | 425/684 [00:33<00:18, 14.04it/s] 62%|██████▏   | 427/684 [00:33<00:18, 14.03it/s] 63%|██████▎   | 429/684 [00:33<00:18, 14.03it/s] 63%|██████▎   | 431/684 [00:33<00:17, 14.06it/s] 63%|██████▎   | 433/684 [00:34<00:17, 14.04it/s] 64%|██████▎   | 435/684 [00:34<00:17, 14.05it/s] 64%|██████▍   | 437/684 [00:34<00:17, 14.06it/s] 64%|██████▍   | 439/684 [00:34<00:17, 14.04it/s] 64%|██████▍   | 441/684 [00:34<00:17, 14.04it/s] 65%|██████▍   | 443/684 [00:34<00:17, 14.03it/s] 65%|██████▌   | 445/684 [00:34<00:17, 14.03it/s] 65%|██████▌   | 447/684 [00:35<00:16, 14.05it/s] 66%|██████▌   | 449/684 [00:35<00:16, 14.04it/s] 66%|██████▌   | 451/684 [00:35<00:16, 14.05it/s] 66%|██████▌   | 453/684 [00:35<00:16, 14.04it/s] 67%|██████▋   | 455/684 [00:35<00:16, 14.04it/s] 67%|██████▋   | 457/684 [00:37<01:32,  2.46it/s] 67%|██████▋   | 459/684 [00:38<01:08,  3.26it/s] 67%|██████▋   | 461/684 [00:38<00:52,  4.25it/s] 68%|██████▊   | 463/684 [00:38<00:41,  5.37it/s] 68%|██████▊   | 465/684 [00:38<00:33,  6.52it/s] 68%|██████▊   | 467/684 [00:38<00:28,  7.65it/s] 69%|██████▊   | 469/684 [00:38<00:24,  8.70it/s] 69%|██████▉   | 471/684 [00:39<00:21,  9.75it/s] 69%|██████▉   | 473/684 [00:39<00:20, 10.45it/s] 69%|██████▉   | 475/684 [00:39<00:18, 11.16it/s] 70%|██████▉   | 477/684 [00:39<00:17, 11.70it/s] 70%|███████   | 479/684 [00:39<00:17, 11.93it/s] 
70%|███████   | 481/684 [00:39<00:16, 12.38it/s] 71%|███████   | 483/684 [00:39<00:16, 12.40it/s] 71%|███████   | 485/684 [00:40<00:15, 12.77it/s] 71%|███████   | 487/684 [00:40<00:15, 12.71it/s] 71%|███████▏  | 489/684 [00:40<00:15, 12.92it/s] 72%|███████▏  | 491/684 [00:40<00:15, 12.71it/s] 72%|███████▏  | 493/684 [00:40<00:14, 12.90it/s] 72%|███████▏  | 495/684 [00:40<00:14, 12.79it/s] 73%|███████▎  | 497/684 [00:41<00:14, 12.73it/s] 73%|███████▎  | 499/684 [00:41<00:14, 12.89it/s]                                                  73%|███████▎  | 500/684 [00:41<00:14, 12.89it/s] 73%|███████▎  | 501/684 [00:41<00:14, 12.80it/s] 74%|███████▎  | 503/684 [00:41<00:13, 13.07it/s] 74%|███████▍  | 505/684 [00:41<00:13, 12.84it/s] 74%|███████▍  | 507/684 [00:41<00:13, 12.65it/s] 74%|███████▍  | 509/684 [00:41<00:13, 12.93it/s] 75%|███████▍  | 511/684 [00:42<00:13, 12.84it/s] 75%|███████▌  | 513/684 [00:42<00:13, 12.85it/s] 75%|███████▌  | 515/684 [00:42<00:12, 13.07it/s] 76%|███████▌  | 517/684 [00:42<00:13, 12.72it/s] 76%|███████▌  | 519/684 [00:42<00:12, 12.94it/s] 76%|███████▌  | 521/684 [00:42<00:12, 12.83it/s] 76%|███████▋  | 523/684 [00:43<00:12, 13.07it/s] 77%|███████▋  | 525/684 [00:43<00:12, 12.95it/s] 77%|███████▋  | 527/684 [00:43<00:11, 13.21it/s] 77%|███████▋  | 529/684 [00:43<00:11, 12.94it/s] 78%|███████▊  | 531/684 [00:43<00:11, 12.88it/s] 78%|███████▊  | 533/684 [00:43<00:11, 13.08it/s] 78%|███████▊  | 535/684 [00:43<00:11, 13.27it/s] 79%|███████▊  | 537/684 [00:44<00:11, 13.34it/s] 79%|███████▉  | 539/684 [00:44<00:10, 13.48it/s] 79%|███████▉  | 541/684 [00:44<00:10, 13.61it/s] 79%|███████▉  | 543/684 [00:44<00:10, 13.76it/s] 80%|███████▉  | 545/684 [00:44<00:10, 13.83it/s] 80%|███████▉  | 547/684 [00:44<00:09, 13.85it/s] 80%|████████  | 549/684 [00:44<00:09, 13.93it/s] 81%|████████  | 551/684 [00:45<00:09, 13.96it/s] 81%|████████  | 553/684 [00:45<00:09, 13.97it/s] 81%|████████  | 555/684 [00:45<00:09, 13.99it/s]
 81%|████████▏ | 557/684 [00:45<00:09, 14.01it/s] 82%|████████▏ | 559/684 [00:45<00:08, 14.03it/s] 82%|████████▏ | 561/684 [00:45<00:08, 13.99it/s] 82%|████████▏ | 563/684 [00:45<00:08, 14.02it/s] 83%|████████▎ | 565/684 [00:46<00:08, 14.03it/s] 83%|████████▎ | 567/684 [00:46<00:08, 14.04it/s] 83%|████████▎ | 569/684 [00:46<00:08, 14.03it/s] 83%|████████▎ | 571/684 [00:46<00:08, 14.04it/s] 84%|████████▍ | 573/684 [00:46<00:07, 14.05it/s] 84%|████████▍ | 575/684 [00:46<00:07, 14.06it/s] 84%|████████▍ | 577/684 [00:46<00:07, 14.17it/s] 85%|████████▍ | 579/684 [00:47<00:07, 14.17it/s] 85%|████████▍ | 581/684 [00:47<00:07, 14.17it/s] 85%|████████▌ | 583/684 [00:47<00:07, 14.14it/s] 86%|████████▌ | 585/684 [00:47<00:07, 14.10it/s] 86%|████████▌ | 587/684 [00:47<00:06, 14.08it/s] 86%|████████▌ | 589/684 [00:47<00:06, 14.08it/s] 86%|████████▋ | 591/684 [00:47<00:06, 14.09it/s] 87%|████████▋ | 593/684 [00:48<00:06, 14.10it/s] 87%|████████▋ | 595/684 [00:48<00:06, 14.07it/s] 87%|████████▋ | 597/684 [00:48<00:06, 14.08it/s] 88%|████████▊ | 599/684 [00:48<00:06, 14.06it/s] 88%|████████▊ | 601/684 [00:48<00:05, 14.14it/s] 88%|████████▊ | 603/684 [00:48<00:05, 14.14it/s] 88%|████████▊ | 605/684 [00:48<00:05, 14.15it/s] 89%|████████▊ | 607/684 [00:49<00:05, 14.16it/s] 89%|████████▉ | 609/684 [00:49<00:05, 14.17it/s] 89%|████████▉ | 611/684 [00:49<00:05, 14.15it/s] 90%|████████▉ | 613/684 [00:49<00:05, 14.12it/s] 90%|████████▉ | 615/684 [00:49<00:04, 14.11it/s] 90%|█████████ | 617/684 [00:49<00:04, 14.10it/s] 90%|█████████ | 619/684 [00:49<00:04, 14.08it/s] 91%|█████████ | 621/684 [00:50<00:04, 14.07it/s] 91%|█████████ | 623/684 [00:50<00:04, 14.07it/s] 91%|█████████▏| 625/684 [00:50<00:04, 14.06it/s] 92%|█████████▏| 627/684 [00:50<00:04, 14.05it/s] 92%|█████████▏| 629/684 [00:50<00:03, 14.04it/s] 92%|█████████▏| 631/684 [00:50<00:03, 14.03it/s] 93%|█████████▎| 633/684 [00:50<00:03, 14.04it/s] 93%|█████████▎| 635/684 [00:51<00:03, 14.02it/s]
 93%|█████████▎| 637/684 [00:51<00:03, 14.04it/s] 93%|█████████▎| 639/684 [00:51<00:03, 14.03it/s] 94%|█████████▎| 641/684 [00:51<00:03, 14.01it/s] 94%|█████████▍| 643/684 [00:51<00:02, 14.03it/s] 94%|█████████▍| 645/684 [00:51<00:02, 14.06it/s] 95%|█████████▍| 647/684 [00:51<00:02, 14.08it/s] 95%|█████████▍| 649/684 [00:52<00:02, 14.11it/s] 95%|█████████▌| 651/684 [00:52<00:02, 14.13it/s] 95%|█████████▌| 653/684 [00:52<00:02, 14.09it/s] 96%|█████████▌| 655/684 [00:52<00:02, 14.08it/s] 96%|█████████▌| 657/684 [00:52<00:01, 14.08it/s] 96%|█████████▋| 659/684 [00:52<00:01, 14.06it/s] 97%|█████████▋| 661/684 [00:52<00:01, 14.08it/s] 97%|█████████▋| 663/684 [00:53<00:01, 14.08it/s] 97%|█████████▋| 665/684 [00:53<00:01, 14.06it/s] 98%|█████████▊| 667/684 [00:53<00:01, 14.10it/s] 98%|█████████▊| 669/684 [00:53<00:01, 14.09it/s] 98%|█████████▊| 671/684 [00:53<00:00, 14.09it/s] 98%|█████████▊| 673/684 [00:53<00:00, 14.09it/s] 99%|█████████▊| 675/684 [00:53<00:00, 14.08it/s] 99%|█████████▉| 677/684 [00:54<00:00, 14.07it/s] 99%|█████████▉| 679/684 [00:54<00:00, 14.06it/s]100%|█████████▉| 681/684 [00:54<00:00, 14.07it/s]100%|█████████▉| 683/684 [00:54<00:00, 14.02it/s]                                                 100%|██████████| 684/684 [00:56<00:00, 14.02it/s]100%|██████████| 684/684 [00:56<00:00, 12.04it/s]
-  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.17s/it] 19%|█▉        | 3/16 [00:08<00:39,  3.08s/it] 25%|██▌       | 4/16 [00:13<00:42,  3.54s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.85s/it] 38%|███▊      | 6/16 [00:21<00:40,  4.03s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.14s/it] 50%|█████     | 8/16 [00:30<00:33,  4.21s/it] 56%|█████▋    | 9/16 [00:34<00:29,  4.27s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.30s/it] 69%|██████▉   | 11/16 [00:43<00:21,  4.32s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.34s/it] 81%|████████▏ | 13/16 [00:52<00:13,  4.35s/it] 88%|████████▊ | 14/16 [00:56<00:08,  4.36s/it] 94%|█████████▍| 15/16 [01:01<00:04,  4.36s/it]100%|██████████| 16/16 [01:04<00:00,  3.98s/it]100%|██████████| 16/16 [01:05<00:00,  4.10s/it]
-/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning
-  warnings.warn(
-/mnt/storage/aatherton/hf_eng_fra_trans is already a clone of https://huggingface.co/aatherton2024/hf_eng_fra_trans. Make sure you pull the latest changes with `repo.git_pull()`.
-  0%|          | 0/2736 [00:00<?, ?it/s]  0%|          | 1/2736 [00:00<04:35,  9.94it/s]  0%|          | 3/2736 [00:00<03:57, 11.52it/s]  0%|          | 5/2736 [00:00<03:49, 11.91it/s]  0%|          | 7/2736 [00:00<03:36, 12.59it/s]  0%|          | 9/2736 [00:00<03:38, 12.48it/s]  0%|          | 11/2736 [00:00<03:37, 12.50it/s]  0%|          | 13/2736 [00:01<03:39, 12.41it/s]  1%|          | 15/2736 [00:01<03:40, 12.33it/s]  1%|          | 17/2736 [00:01<03:39, 12.38it/s]  1%|          | 19/2736 [00:01<03:38, 12.44it/s]  1%|          | 21/2736 [00:01<03:38, 12.44it/s]  1%|          | 23/2736 [00:01<03:40, 12.29it/s]  1%|          | 25/2736 [00:02<03:38, 12.40it/s]  1%|          | 27/2736 [00:02<03:39, 12.34it/s]  1%|          | 29/2736 [00:02<03:38, 12.38it/s]  1%|          | 31/2736 [00:02<03:37, 12.44it/s]  1%|          | 33/2736 [00:02<03:41, 12.18it/s]  1%|▏         | 35/2736 [00:02<03:43, 12.10it/s]  1%|▏         | 37/2736 [00:03<03:40, 12.23it/s]  1%|▏         | 39/2736 [00:03<03:40, 12.25it/s]  1%|▏         | 41/2736 [00:03<03:37, 12.36it/s]  2%|▏         | 43/2736 [00:03<03:36, 12.42it/s]  2%|▏         | 45/2736 [00:03<03:36, 12.44it/s]  2%|▏         | 47/2736 [00:03<03:35, 12.50it/s]  2%|▏         | 49/2736 [00:03<03:34, 12.53it/s]  2%|▏         | 51/2736 [00:04<03:34, 12.51it/s]  2%|▏         | 53/2736 [00:04<03:34, 12.52it/s]  2%|▏         | 55/2736 [00:04<03:34, 12.51it/s]  2%|▏         | 57/2736 [00:04<03:35, 12.45it/s]  2%|▏         | 59/2736 [00:04<03:36, 12.37it/s]  2%|▏         | 61/2736 [00:04<03:37, 12.28it/s]  2%|▏         | 63/2736 [00:05<03:37, 12.29it/s]  2%|▏         | 65/2736 [00:05<03:36, 12.35it/s]  2%|▏         | 67/2736 [00:05<03:37, 12.28it/s]  3%|▎         | 69/2736 [00:05<03:35, 12.35it/s]  3%|▎         | 71/2736 [00:05<03:36, 12.32it/s]  3%|▎         | 73/2736 [00:05<03:36, 12.28it/s]  3%|▎         | 75/2736 [00:06<03:34, 12.39it/s]  3%|▎         | 77/2736 [00:06<03:36, 12.31it/s]  3%|▎      
   | 79/2736 [00:06<03:34, 12.39it/s]  3%|▎         | 81/2736 [00:06<03:34, 12.40it/s]  3%|▎         | 83/2736 [00:06<03:33, 12.40it/s]  3%|▎         | 85/2736 [00:06<03:36, 12.26it/s]  3%|▎         | 87/2736 [00:07<03:34, 12.34it/s]  3%|▎         | 89/2736 [00:07<03:35, 12.30it/s]  3%|▎         | 91/2736 [00:07<03:33, 12.37it/s]  3%|▎         | 93/2736 [00:07<03:33, 12.40it/s]  3%|▎         | 95/2736 [00:07<03:33, 12.39it/s]  4%|▎         | 97/2736 [00:07<03:32, 12.41it/s]  4%|▎         | 99/2736 [00:08<03:31, 12.45it/s]  4%|▎         | 101/2736 [00:08<03:30, 12.51it/s]  4%|▍         | 103/2736 [00:08<03:30, 12.50it/s]  4%|▍         | 105/2736 [00:08<03:29, 12.54it/s]  4%|▍         | 107/2736 [00:08<03:29, 12.55it/s]  4%|▍         | 109/2736 [00:08<03:29, 12.55it/s]  4%|▍         | 111/2736 [00:08<03:28, 12.57it/s]  4%|▍         | 113/2736 [00:09<03:29, 12.54it/s]  4%|▍         | 115/2736 [00:09<03:29, 12.54it/s]  4%|▍         | 117/2736 [00:09<03:28, 12.54it/s]  4%|▍         | 119/2736 [00:09<03:29, 12.51it/s]  4%|▍         | 121/2736 [00:09<03:28, 12.55it/s]  4%|▍         | 123/2736 [00:09<03:28, 12.52it/s]  5%|▍         | 125/2736 [00:10<03:28, 12.53it/s]  5%|▍         | 127/2736 [00:10<03:28, 12.53it/s]  5%|▍         | 129/2736 [00:10<03:27, 12.55it/s]  5%|▍         | 131/2736 [00:10<03:27, 12.56it/s]  5%|▍         | 133/2736 [00:10<03:28, 12.51it/s]  5%|▍         | 135/2736 [00:10<03:26, 12.57it/s]  5%|▌         | 137/2736 [00:11<03:26, 12.58it/s]  5%|▌         | 139/2736 [00:11<03:26, 12.60it/s]  5%|▌         | 141/2736 [00:11<03:25, 12.61it/s]  5%|▌         | 143/2736 [00:11<03:26, 12.55it/s]  5%|▌         | 145/2736 [00:11<03:26, 12.55it/s]  5%|▌         | 147/2736 [00:11<03:26, 12.51it/s]  5%|▌         | 149/2736 [00:11<03:26, 12.53it/s]  6%|▌         | 151/2736 [00:12<03:26, 12.53it/s]  6%|▌         | 153/2736 [00:12<03:25, 12.56it/s]  6%|▌         | 155/2736 [00:12<03:25, 12.55it/s]  6%|▌         | 157/2736 
[00:12<03:25, 12.55it/s]  6%|▌         | 159/2736 [00:12<03:26, 12.48it/s]  6%|▌         | 161/2736 [00:12<03:25, 12.54it/s]  6%|▌         | 163/2736 [00:13<03:26, 12.45it/s]  6%|▌         | 165/2736 [00:13<03:25, 12.50it/s]  6%|▌         | 167/2736 [00:13<03:27, 12.37it/s]  6%|▌         | 169/2736 [00:13<03:26, 12.45it/s]  6%|▋         | 171/2736 [00:13<03:26, 12.40it/s]  6%|▋         | 173/2736 [00:13<03:25, 12.49it/s]  6%|▋         | 175/2736 [00:14<03:26, 12.38it/s]  6%|▋         | 177/2736 [00:14<03:26, 12.42it/s]  7%|▋         | 179/2736 [00:14<03:25, 12.43it/s]  7%|▋         | 181/2736 [00:14<03:24, 12.51it/s]  7%|▋         | 183/2736 [00:14<03:23, 12.52it/s]  7%|▋         | 185/2736 [00:14<03:25, 12.42it/s]  7%|▋         | 187/2736 [00:15<03:24, 12.45it/s]  7%|▋         | 189/2736 [00:15<03:25, 12.42it/s]  7%|▋         | 191/2736 [00:15<03:23, 12.50it/s]  7%|▋         | 193/2736 [00:15<03:24, 12.41it/s]  7%|▋         | 195/2736 [00:15<03:24, 12.43it/s]  7%|▋         | 197/2736 [00:15<03:24, 12.41it/s]  7%|▋         | 199/2736 [00:16<03:24, 12.40it/s]  7%|▋         | 201/2736 [00:16<03:23, 12.44it/s]  7%|▋         | 203/2736 [00:16<03:25, 12.31it/s]  7%|▋         | 205/2736 [00:16<03:25, 12.35it/s]  8%|▊         | 207/2736 [00:16<03:24, 12.37it/s]  8%|▊         | 209/2736 [00:16<03:23, 12.43it/s]  8%|▊         | 211/2736 [00:16<03:23, 12.39it/s]  8%|▊         | 213/2736 [00:17<03:25, 12.30it/s]  8%|▊         | 215/2736 [00:17<03:23, 12.40it/s]  8%|▊         | 217/2736 [00:17<03:24, 12.35it/s]  8%|▊         | 219/2736 [00:17<03:22, 12.44it/s]  8%|▊         | 221/2736 [00:17<03:22, 12.42it/s]  8%|▊         | 223/2736 [00:17<03:22, 12.43it/s]  8%|▊         | 225/2736 [00:18<03:20, 12.52it/s]  8%|▊         | 227/2736 [00:18<03:21, 12.45it/s]  8%|▊         | 229/2736 [00:18<03:20, 12.52it/s]  8%|▊         | 231/2736 [00:18<03:20, 12.48it/s]  9%|▊         | 233/2736 [00:18<03:20, 12.48it/s]  9%|▊         | 235/2736 
[00:18<03:19, 12.52it/s]  9%|▊         | 237/2736 [00:19<03:20, 12.45it/s]  9%|▊         | 239/2736 [00:19<03:21, 12.37it/s]  9%|▉         | 241/2736 [00:19<03:20, 12.44it/s]  9%|▉         | 243/2736 [00:19<03:21, 12.40it/s]  9%|▉         | 245/2736 [00:19<03:20, 12.45it/s]  9%|▉         | 247/2736 [00:19<03:20, 12.44it/s]  9%|▉         | 249/2736 [00:20<03:19, 12.44it/s]  9%|▉         | 251/2736 [00:20<03:21, 12.35it/s]  9%|▉         | 253/2736 [00:20<03:20, 12.40it/s]  9%|▉         | 255/2736 [00:20<03:21, 12.31it/s]  9%|▉         | 257/2736 [00:20<03:21, 12.29it/s]  9%|▉         | 259/2736 [00:20<03:21, 12.32it/s] 10%|▉         | 261/2736 [00:21<03:20, 12.32it/s] 10%|▉         | 263/2736 [00:21<03:20, 12.31it/s] 10%|▉         | 265/2736 [00:21<03:19, 12.38it/s] 10%|▉         | 267/2736 [00:21<03:21, 12.28it/s] 10%|▉         | 269/2736 [00:21<03:21, 12.23it/s] 10%|▉         | 271/2736 [00:21<03:19, 12.36it/s] 10%|▉         | 273/2736 [00:21<03:19, 12.33it/s] 10%|█         | 275/2736 [00:22<03:18, 12.42it/s] 10%|█         | 277/2736 [00:22<03:18, 12.41it/s] 10%|█         | 279/2736 [00:22<03:17, 12.45it/s] 10%|█         | 281/2736 [00:22<03:17, 12.44it/s] 10%|█         | 283/2736 [00:22<03:17, 12.44it/s] 10%|█         | 285/2736 [00:22<03:17, 12.40it/s] 10%|█         | 287/2736 [00:23<03:16, 12.45it/s] 11%|█         | 289/2736 [00:23<03:16, 12.48it/s] 11%|█         | 291/2736 [00:23<03:16, 12.46it/s] 11%|█         | 293/2736 [00:23<03:16, 12.43it/s] 11%|█         | 295/2736 [00:23<03:17, 12.38it/s] 11%|█         | 297/2736 [00:23<03:16, 12.39it/s] 11%|█         | 299/2736 [00:24<03:17, 12.33it/s] 11%|█         | 301/2736 [00:24<03:16, 12.37it/s] 11%|█         | 303/2736 [00:24<03:17, 12.33it/s] 11%|█         | 305/2736 [00:24<03:17, 12.30it/s] 11%|█         | 307/2736 [00:24<03:15, 12.40it/s] 11%|█▏        | 309/2736 [00:24<03:14, 12.47it/s] 11%|█▏        | 311/2736 [00:25<03:16, 12.37it/s] 11%|█▏        | 313/2736 
[00:25<03:16, 12.31it/s] 12%|█▏        | 315/2736 [00:25<03:15, 12.39it/s] 12%|█▏        | 317/2736 [00:25<03:16, 12.31it/s] 12%|█▏        | 319/2736 [00:25<03:17, 12.23it/s] 12%|█▏        | 321/2736 [00:25<03:15, 12.37it/s] 12%|█▏        | 323/2736 [00:26<03:15, 12.33it/s] 12%|█▏        | 325/2736 [00:26<03:16, 12.25it/s] 12%|█▏        | 327/2736 [00:26<03:16, 12.23it/s] 12%|█▏        | 329/2736 [00:26<03:14, 12.38it/s] 12%|█▏        | 331/2736 [00:26<03:14, 12.35it/s] 12%|█▏        | 333/2736 [00:26<03:15, 12.32it/s] 12%|█▏        | 335/2736 [00:26<03:13, 12.43it/s] 12%|█▏        | 337/2736 [00:27<03:14, 12.36it/s] 12%|█▏        | 339/2736 [00:27<03:12, 12.48it/s] 12%|█▏        | 341/2736 [00:27<03:11, 12.49it/s] 13%|█▎        | 343/2736 [00:27<03:10, 12.55it/s] 13%|█▎        | 345/2736 [00:27<03:10, 12.53it/s] 13%|█▎        | 347/2736 [00:27<03:11, 12.48it/s] 13%|█▎        | 349/2736 [00:28<03:11, 12.47it/s] 13%|█▎        | 351/2736 [00:28<03:09, 12.56it/s] 13%|█▎        | 353/2736 [00:28<03:11, 12.44it/s] 13%|█▎        | 355/2736 [00:28<03:10, 12.49it/s] 13%|█▎        | 357/2736 [00:28<03:11, 12.42it/s] 13%|█▎        | 359/2736 [00:28<03:10, 12.48it/s] 13%|█▎        | 361/2736 [00:29<03:10, 12.48it/s] 13%|█▎        | 363/2736 [00:29<03:10, 12.43it/s] 13%|█▎        | 365/2736 [00:29<03:09, 12.49it/s] 13%|█▎        | 367/2736 [00:29<03:10, 12.41it/s] 13%|█▎        | 369/2736 [00:29<03:10, 12.41it/s] 14%|█▎        | 371/2736 [00:29<03:09, 12.46it/s] 14%|█▎        | 373/2736 [00:30<03:10, 12.43it/s] 14%|█▎        | 375/2736 [00:30<03:09, 12.44it/s] 14%|█▍        | 377/2736 [00:30<03:09, 12.45it/s] 14%|█▍        | 379/2736 [00:30<03:09, 12.42it/s] 14%|█▍        | 381/2736 [00:30<03:10, 12.34it/s] 14%|█▍        | 383/2736 [00:30<03:09, 12.41it/s] 14%|█▍        | 385/2736 [00:31<03:10, 12.37it/s] 14%|█▍        | 387/2736 [00:31<03:09, 12.36it/s] 14%|█▍        | 389/2736 [00:31<03:09, 12.41it/s] 14%|█▍        | 391/2736 
[00:31<03:10, 12.34it/s] 14%|█▍        | 393/2736 [00:31<03:08, 12.41it/s] 14%|█▍        | 395/2736 [00:31<03:09, 12.36it/s] 15%|█▍        | 397/2736 [00:31<03:08, 12.43it/s] 15%|█▍        | 399/2736 [00:32<03:08, 12.37it/s] 15%|█▍        | 401/2736 [00:32<03:08, 12.36it/s] 15%|█▍        | 403/2736 [00:32<03:08, 12.36it/s] 15%|█▍        | 405/2736 [00:32<03:08, 12.34it/s] 15%|█▍        | 407/2736 [00:32<03:07, 12.41it/s] 15%|█▍        | 409/2736 [00:32<03:06, 12.49it/s] 15%|█▌        | 411/2736 [00:33<03:05, 12.51it/s] 15%|█▌        | 413/2736 [00:33<03:06, 12.45it/s] 15%|█▌        | 415/2736 [00:33<03:06, 12.42it/s] 15%|█▌        | 417/2736 [00:33<03:06, 12.44it/s] 15%|█▌        | 419/2736 [00:33<03:05, 12.47it/s] 15%|█▌        | 421/2736 [00:33<03:06, 12.40it/s] 15%|█▌        | 423/2736 [00:34<03:06, 12.43it/s] 16%|█▌        | 425/2736 [00:34<03:06, 12.42it/s] 16%|█▌        | 427/2736 [00:34<03:06, 12.40it/s] 16%|█▌        | 429/2736 [00:34<03:05, 12.41it/s] 16%|█▌        | 431/2736 [00:34<03:05, 12.40it/s] 16%|█▌        | 433/2736 [00:34<03:05, 12.43it/s] 16%|█▌        | 435/2736 [00:35<03:05, 12.44it/s] 16%|█▌        | 437/2736 [00:35<03:04, 12.45it/s] 16%|█▌        | 439/2736 [00:35<03:04, 12.46it/s] 16%|█▌        | 441/2736 [00:35<03:04, 12.42it/s] 16%|█▌        | 443/2736 [00:35<03:03, 12.50it/s] 16%|█▋        | 445/2736 [00:35<03:03, 12.51it/s] 16%|█▋        | 447/2736 [00:36<03:04, 12.38it/s] 16%|█▋        | 449/2736 [00:36<03:05, 12.34it/s] 16%|█▋        | 451/2736 [00:36<03:04, 12.38it/s] 17%|█▋        | 453/2736 [00:36<03:03, 12.43it/s] 17%|█▋        | 455/2736 [00:36<03:04, 12.37it/s] 17%|█▋        | 457/2736 [00:36<03:03, 12.40it/s] 17%|█▋        | 459/2736 [00:36<03:04, 12.35it/s] 17%|█▋        | 461/2736 [00:37<03:02, 12.46it/s] 17%|█▋        | 463/2736 [00:37<03:03, 12.38it/s] 17%|█▋        | 465/2736 [00:37<03:02, 12.44it/s] 17%|█▋        | 467/2736 [00:37<03:03, 12.35it/s] 17%|█▋        | 469/2736 
[00:37<03:02, 12.41it/s] 17%|█▋        | 471/2736 [00:37<03:03, 12.38it/s] 17%|█▋        | 473/2736 [00:38<03:02, 12.42it/s] 17%|█▋        | 475/2736 [00:38<03:02, 12.36it/s] 17%|█▋        | 477/2736 [00:38<03:02, 12.38it/s] 18%|█▊        | 479/2736 [00:38<03:02, 12.39it/s] 18%|█▊        | 481/2736 [00:38<03:02, 12.34it/s] 18%|█▊        | 483/2736 [00:38<03:01, 12.41it/s] 18%|█▊        | 485/2736 [00:39<03:01, 12.42it/s] 18%|█▊        | 487/2736 [00:39<03:01, 12.39it/s] 18%|█▊        | 489/2736 [00:39<03:00, 12.47it/s] 18%|█▊        | 491/2736 [00:39<03:00, 12.43it/s] 18%|█▊        | 493/2736 [00:39<02:59, 12.47it/s] 18%|█▊        | 495/2736 [00:39<03:00, 12.45it/s] 18%|█▊        | 497/2736 [00:40<02:59, 12.46it/s] 18%|█▊        | 499/2736 [00:40<02:58, 12.50it/s] 18%|█▊        | 501/2736 [00:40<02:59, 12.45it/s] 18%|█▊        | 503/2736 [00:40<02:58, 12.48it/s] 18%|█▊        | 505/2736 [00:40<02:57, 12.56it/s] 19%|█▊        | 507/2736 [00:40<02:57, 12.53it/s] 19%|█▊        | 509/2736 [00:40<02:58, 12.45it/s] 19%|█▊        | 511/2736 [00:41<02:57, 12.50it/s] 19%|█▉        | 513/2736 [00:41<02:58, 12.48it/s] 19%|█▉        | 515/2736 [00:41<02:57, 12.53it/s] 19%|█▉        | 517/2736 [00:41<02:57, 12.53it/s] 19%|█▉        | 519/2736 [00:41<02:56, 12.53it/s] 19%|█▉        | 521/2736 [00:41<02:56, 12.52it/s] 19%|█▉        | 523/2736 [00:42<02:56, 12.54it/s] 19%|█▉        | 525/2736 [00:42<02:57, 12.48it/s] 19%|█▉        | 527/2736 [00:42<02:56, 12.52it/s] 19%|█▉        | 529/2736 [00:42<02:57, 12.44it/s] 19%|█▉        | 531/2736 [00:42<02:56, 12.49it/s] 19%|█▉        | 533/2736 [00:42<02:55, 12.54it/s] 20%|█▉        | 535/2736 [00:43<02:56, 12.44it/s] 20%|█▉        | 537/2736 [00:43<02:56, 12.46it/s] 20%|█▉        | 539/2736 [00:43<02:56, 12.47it/s] 20%|█▉        | 541/2736 [00:43<02:56, 12.41it/s] 20%|█▉        | 543/2736 [00:43<02:56, 12.45it/s] 20%|█▉        | 545/2736 [00:43<02:55, 12.47it/s] 20%|█▉        | 547/2736 
[00:44<02:56, 12.42it/s] 20%|██        | 549/2736 [00:44<02:56, 12.41it/s] 20%|██        | 551/2736 [00:44<02:56, 12.41it/s] 20%|██        | 553/2736 [00:44<02:55, 12.43it/s] 20%|██        | 555/2736 [00:44<02:55, 12.40it/s] 20%|██        | 557/2736 [00:44<02:56, 12.33it/s] 20%|██        | 559/2736 [00:45<02:55, 12.39it/s] 21%|██        | 561/2736 [00:45<02:56, 12.33it/s] 21%|██        | 563/2736 [00:45<02:55, 12.41it/s] 21%|██        | 565/2736 [00:45<02:55, 12.37it/s] 21%|██        | 567/2736 [00:45<02:54, 12.43it/s] 21%|██        | 569/2736 [00:45<02:55, 12.36it/s] 21%|██        | 571/2736 [00:45<02:54, 12.41it/s] 21%|██        | 573/2736 [00:46<02:54, 12.38it/s] 21%|██        | 575/2736 [00:46<02:53, 12.48it/s] 21%|██        | 577/2736 [00:46<02:54, 12.34it/s] 21%|██        | 579/2736 [00:46<02:54, 12.33it/s] 21%|██        | 581/2736 [00:46<02:53, 12.42it/s] 21%|██▏       | 583/2736 [00:46<02:54, 12.34it/s] 21%|██▏       | 585/2736 [00:47<02:52, 12.44it/s] 21%|██▏       | 587/2736 [00:47<02:53, 12.36it/s] 22%|██▏       | 589/2736 [00:47<02:52, 12.46it/s] 22%|██▏       | 591/2736 [00:47<02:53, 12.39it/s] 22%|██▏       | 593/2736 [00:47<02:51, 12.49it/s] 22%|██▏       | 595/2736 [00:47<02:51, 12.47it/s] 22%|██▏       | 597/2736 [00:48<02:51, 12.44it/s] 22%|██▏       | 599/2736 [00:48<02:52, 12.40it/s] 22%|██▏       | 601/2736 [00:48<02:52, 12.40it/s] 22%|██▏       | 603/2736 [00:48<02:50, 12.49it/s] 22%|██▏       | 605/2736 [00:48<02:51, 12.40it/s] 22%|██▏       | 607/2736 [00:48<02:51, 12.42it/s] 22%|██▏       | 609/2736 [00:49<02:51, 12.39it/s] 22%|██▏       | 611/2736 [00:49<02:51, 12.41it/s] 22%|██▏       | 613/2736 [00:49<02:51, 12.39it/s] 22%|██▏       | 615/2736 [00:49<02:49, 12.48it/s] 23%|██▎       | 617/2736 [00:49<02:50, 12.44it/s] 23%|██▎       | 619/2736 [00:49<02:49, 12.47it/s] 23%|██▎       | 621/2736 [00:49<02:49, 12.48it/s] 23%|██▎       | 623/2736 [00:50<02:49, 12.46it/s] 23%|██▎       | 625/2736 
[00:50<02:49, 12.49it/s] 23%|██▎       | 627/2736 [00:50<02:50, 12.40it/s] 23%|██▎       | 629/2736 [00:50<02:48, 12.48it/s] 23%|██▎       | 631/2736 [00:50<02:48, 12.46it/s] 23%|██▎       | 633/2736 [00:50<02:48, 12.48it/s] 23%|██▎       | 635/2736 [00:51<02:47, 12.51it/s] 23%|██▎       | 637/2736 [00:51<02:48, 12.44it/s] 23%|██▎       | 639/2736 [00:51<02:47, 12.49it/s] 23%|██▎       | 641/2736 [00:51<02:49, 12.38it/s] 24%|██▎       | 643/2736 [00:51<02:47, 12.46it/s] 24%|██▎       | 645/2736 [00:51<02:48, 12.38it/s] 24%|██▎       | 647/2736 [00:52<02:47, 12.45it/s] 24%|██▎       | 649/2736 [00:52<02:48, 12.40it/s] 24%|██▍       | 651/2736 [00:52<02:47, 12.46it/s] 24%|██▍       | 653/2736 [00:52<02:47, 12.41it/s] 24%|██▍       | 655/2736 [00:52<02:46, 12.48it/s] 24%|██▍       | 657/2736 [00:52<02:47, 12.40it/s] 24%|██▍       | 659/2736 [00:53<02:47, 12.40it/s] 24%|██▍       | 661/2736 [00:53<02:46, 12.45it/s] 24%|██▍       | 663/2736 [00:53<02:45, 12.49it/s] 24%|██▍       | 665/2736 [00:53<02:45, 12.53it/s] 24%|██▍       | 667/2736 [00:53<02:46, 12.43it/s] 24%|██▍       | 669/2736 [00:53<02:45, 12.48it/s] 25%|██▍       | 671/2736 [00:54<02:46, 12.40it/s] 25%|██▍       | 673/2736 [00:54<02:45, 12.46it/s] 25%|██▍       | 675/2736 [00:54<02:46, 12.38it/s] 25%|██▍       | 677/2736 [00:54<02:45, 12.42it/s] 25%|██▍       | 679/2736 [00:54<02:46, 12.37it/s] 25%|██▍       | 681/2736 [00:54<02:44, 12.46it/s] 25%|██▍       | 683/2736 [00:54<02:46, 12.37it/s] 25%|██▌       | 685/2736 [00:55<02:44, 12.44it/s] 25%|██▌       | 687/2736 [00:55<02:45, 12.39it/s] 25%|██▌       | 689/2736 [00:55<02:45, 12.36it/s] 25%|██▌       | 691/2736 [00:55<02:44, 12.40it/s] 25%|██▌       | 693/2736 [00:55<02:43, 12.48it/s] 25%|██▌       | 695/2736 [00:55<02:44, 12.39it/s] 25%|██▌       | 697/2736 [00:56<02:44, 12.43it/s] 26%|██▌       | 699/2736 [00:56<02:44, 12.40it/s] 26%|██▌       | 701/2736 [00:56<02:45, 12.33it/s] 26%|██▌       | 703/2736 
[00:56<02:43, 12.41it/s] 26%|██▌       | 705/2736 [00:56<02:43, 12.39it/s] 26%|██▌       | 707/2736 [00:56<02:43, 12.42it/s] 26%|██▌       | 709/2736 [00:57<02:43, 12.42it/s] 26%|██▌       | 711/2736 [00:57<02:42, 12.46it/s] 26%|██▌       | 713/2736 [00:57<02:41, 12.49it/s] 26%|██▌       | 715/2736 [00:57<02:41, 12.48it/s] 26%|██▌       | 717/2736 [00:57<02:42, 12.39it/s] 26%|██▋       | 719/2736 [00:57<02:41, 12.46it/s] 26%|██▋       | 721/2736 [00:58<02:42, 12.38it/s] 26%|██▋       | 723/2736 [00:58<02:41, 12.46it/s] 26%|██▋       | 725/2736 [00:58<02:40, 12.52it/s] 27%|██▋       | 727/2736 [00:58<02:41, 12.43it/s] 27%|██▋       | 729/2736 [00:58<02:43, 12.28it/s] 27%|██▋       | 731/2736 [00:58<02:43, 12.26it/s] 27%|██▋       | 733/2736 [00:59<02:43, 12.21it/s] 27%|██▋       | 735/2736 [00:59<02:41, 12.35it/s] 27%|██▋       | 737/2736 [00:59<02:42, 12.33it/s] 27%|██▋       | 739/2736 [00:59<02:40, 12.41it/s] 27%|██▋       | 741/2736 [00:59<02:42, 12.31it/s] 27%|██▋       | 743/2736 [00:59<02:41, 12.36it/s] 27%|██▋       | 745/2736 [00:59<02:41, 12.34it/s] 27%|██▋       | 747/2736 [01:00<02:39, 12.44it/s] 27%|██▋       | 749/2736 [01:00<02:40, 12.37it/s] 27%|██▋       | 751/2736 [01:00<02:39, 12.48it/s] 28%|██▊       | 753/2736 [01:00<02:40, 12.35it/s] 28%|██▊       | 755/2736 [01:00<02:41, 12.29it/s] 28%|██▊       | 757/2736 [01:00<02:40, 12.34it/s] 28%|██▊       | 759/2736 [01:01<02:39, 12.36it/s] 28%|██▊       | 761/2736 [01:01<02:38, 12.43it/s] 28%|██▊       | 763/2736 [01:01<02:39, 12.36it/s] 28%|██▊       | 765/2736 [01:01<02:38, 12.45it/s] 28%|██▊       | 767/2736 [01:01<02:39, 12.36it/s] 28%|██▊       | 769/2736 [01:01<02:37, 12.46it/s] 28%|██▊       | 771/2736 [01:02<02:38, 12.42it/s] 28%|██▊       | 773/2736 [01:02<02:37, 12.45it/s] 28%|██▊       | 775/2736 [01:02<02:37, 12.43it/s] 28%|██▊       | 777/2736 [01:02<02:37, 12.45it/s] 28%|██▊       | 779/2736 [01:02<02:36, 12.52it/s] 29%|██▊       | 781/2736 
[01:02<02:36, 12.49it/s] 29%|██▊       | 783/2736 [01:03<02:36, 12.45it/s] 29%|██▊       | 785/2736 [01:03<02:36, 12.49it/s] 29%|██▉       | 787/2736 [01:03<02:36, 12.44it/s] 29%|██▉       | 789/2736 [01:03<02:35, 12.53it/s] 29%|██▉       | 791/2736 [01:03<02:36, 12.44it/s] 29%|██▉       | 793/2736 [01:03<02:35, 12.49it/s] 29%|██▉       | 795/2736 [01:04<02:35, 12.51it/s] 29%|██▉       | 797/2736 [01:04<02:35, 12.44it/s] 29%|██▉       | 799/2736 [01:04<02:34, 12.50it/s] 29%|██▉       | 801/2736 [01:04<02:35, 12.42it/s] 29%|██▉       | 803/2736 [01:04<02:35, 12.47it/s] 29%|██▉       | 805/2736 [01:04<02:34, 12.49it/s] 29%|██▉       | 807/2736 [01:04<02:34, 12.50it/s] 30%|██▉       | 809/2736 [01:05<02:34, 12.50it/s] 30%|██▉       | 811/2736 [01:05<02:33, 12.54it/s] 30%|██▉       | 813/2736 [01:05<02:33, 12.50it/s] 30%|██▉       | 815/2736 [01:05<02:33, 12.52it/s] 30%|██▉       | 817/2736 [01:05<02:32, 12.58it/s] 30%|██▉       | 819/2736 [01:05<02:32, 12.55it/s] 30%|███       | 821/2736 [01:06<02:32, 12.53it/s] 30%|███       | 823/2736 [01:06<02:32, 12.55it/s] 30%|███       | 825/2736 [01:06<02:32, 12.54it/s] 30%|███       | 827/2736 [01:06<02:32, 12.53it/s] 30%|███       | 829/2736 [01:06<02:32, 12.54it/s] 30%|███       | 831/2736 [01:06<02:31, 12.54it/s] 30%|███       | 833/2736 [01:07<02:32, 12.51it/s] 31%|███       | 835/2736 [01:07<02:31, 12.52it/s] 31%|███       | 837/2736 [01:07<02:31, 12.52it/s] 31%|███       | 839/2736 [01:07<02:31, 12.56it/s] 31%|███       | 841/2736 [01:07<02:31, 12.55it/s] 31%|███       | 843/2736 [01:07<02:31, 12.49it/s] 31%|███       | 845/2736 [01:08<02:31, 12.52it/s] 31%|███       | 847/2736 [01:08<02:31, 12.44it/s] 31%|███       | 849/2736 [01:08<02:31, 12.50it/s] 31%|███       | 851/2736 [01:08<02:30, 12.51it/s] 31%|███       | 853/2736 [01:08<02:30, 12.54it/s] 31%|███▏      | 855/2736 [01:08<02:29, 12.54it/s] 31%|███▏      | 857/2736 [01:08<02:29, 12.53it/s] 31%|███▏      | 859/2736 
[01:09<02:29, 12.55it/s] 31%|███▏      | 861/2736 [01:09<02:29, 12.52it/s] 32%|███▏      | 863/2736 [01:09<02:29, 12.51it/s] 32%|███▏      | 865/2736 [01:09<02:29, 12.52it/s] 32%|███▏      | 867/2736 [01:09<02:29, 12.54it/s] 32%|███▏      | 869/2736 [01:09<02:28, 12.55it/s] 32%|███▏      | 871/2736 [01:10<02:28, 12.58it/s] 32%|███▏      | 873/2736 [01:10<02:28, 12.54it/s] 32%|███▏      | 875/2736 [01:10<02:30, 12.41it/s] 32%|███▏      | 877/2736 [01:10<02:30, 12.34it/s] 32%|███▏      | 879/2736 [01:10<02:29, 12.43it/s] 32%|███▏      | 881/2736 [01:10<02:30, 12.35it/s] 32%|███▏      | 883/2736 [01:11<02:29, 12.43it/s] 32%|███▏      | 885/2736 [01:11<02:29, 12.41it/s] 32%|███▏      | 887/2736 [01:11<02:28, 12.42it/s] 32%|███▏      | 889/2736 [01:11<02:28, 12.46it/s] 33%|███▎      | 891/2736 [01:11<02:28, 12.42it/s] 33%|███▎      | 893/2736 [01:11<02:27, 12.46it/s] 33%|███▎      | 895/2736 [01:12<02:27, 12.48it/s] 33%|███▎      | 897/2736 [01:12<02:28, 12.42it/s] 33%|███▎      | 899/2736 [01:12<02:27, 12.42it/s] 33%|███▎      | 901/2736 [01:12<02:27, 12.44it/s] 33%|███▎      | 903/2736 [01:12<02:27, 12.44it/s] 33%|███▎      | 905/2736 [01:12<02:27, 12.45it/s] 33%|███▎      | 907/2736 [01:12<02:27, 12.39it/s] 33%|███▎      | 909/2736 [01:13<02:26, 12.46it/s] 33%|███▎      | 911/2736 [01:13<02:26, 12.44it/s]
-  0%|          | 0/126 [00:00<?, ?it/s][A
-  1%|          | 1/126 [00:02<04:43,  2.27s/it][A
-  2%|▏         | 2/126 [00:03<03:28,  1.68s/it][A
-  2%|▏         | 3/126 [00:04<03:02,  1.48s/it][A
-  3%|▎         | 4/126 [00:06<02:49,  1.39s/it][A
-  4%|▍         | 5/126 [00:07<02:41,  1.34s/it][A
-  5%|▍         | 6/126 [00:08<02:36,  1.31s/it][A
-  6%|▌         | 7/126 [00:09<02:33,  1.29s/it][A
-  6%|▋         | 8/126 [00:11<02:31,  1.28s/it][A
-  7%|▋         | 9/126 [00:12<02:28,  1.27s/it][A
-  8%|▊         | 10/126 [00:13<02:26,  1.26s/it][A
-  9%|▊         | 11/126 [00:14<02:24,  1.26s/it][A 33%|███▎      | 912/2736 [01:28<02:26, 12.44it/s]
- 10%|▉         | 12/126 [00:16<02:23,  1.26s/it][A
- 10%|█         | 13/126 [00:17<02:20,  1.25s/it][A
- 11%|█         | 14/126 [00:18<02:18,  1.23s/it][A
- 12%|█▏        | 15/126 [00:19<02:17,  1.24s/it][A
- 13%|█▎        | 16/126 [00:20<02:16,  1.24s/it][A
- 13%|█▎        | 17/126 [00:22<02:15,  1.25s/it][A
- 14%|█▍        | 18/126 [00:23<02:14,  1.25s/it][A
- 15%|█▌        | 19/126 [00:24<02:13,  1.24s/it][A
- 16%|█▌        | 20/126 [00:25<02:11,  1.24s/it][A
- 17%|█▋        | 21/126 [00:27<02:10,  1.24s/it][A
- 17%|█▋        | 22/126 [00:28<02:09,  1.25s/it][A
- 18%|█▊        | 23/126 [00:29<02:08,  1.25s/it][A
- 19%|█▉        | 24/126 [00:30<02:07,  1.25s/it][A
- 20%|█▉        | 25/126 [00:32<02:07,  1.26s/it][A
- 21%|██        | 26/126 [00:33<02:04,  1.24s/it][A
- 21%|██▏       | 27/126 [00:34<02:01,  1.23s/it][A
- 22%|██▏       | 28/126 [00:35<01:59,  1.22s/it][A
- 23%|██▎       | 29/126 [00:37<01:58,  1.22s/it][A
- 24%|██▍       | 30/126 [00:38<01:56,  1.21s/it][A
- 25%|██▍       | 31/126 [00:39<01:55,  1.21s/it][A
- 25%|██▌       | 32/126 [00:40<01:53,  1.21s/it][A
- 26%|██▌       | 33/126 [00:41<01:52,  1.21s/it][A
- 27%|██▋       | 34/126 [00:43<01:50,  1.20s/it][A
- 28%|██▊       | 35/126 [00:44<01:49,  1.20s/it][A
- 29%|██▊       | 36/126 [00:45<01:47,  1.20s/it][A
- 29%|██▉       | 37/126 [00:46<01:46,  1.20s/it][A
- 30%|███       | 38/126 [00:47<01:45,  1.20s/it][A
- 31%|███       | 39/126 [00:49<01:44,  1.20s/it][A
- 32%|███▏      | 40/126 [00:50<01:43,  1.20s/it][A
- 33%|███▎      | 41/126 [00:51<01:42,  1.20s/it][A
- 33%|███▎      | 42/126 [00:52<01:40,  1.20s/it][A
- 34%|███▍      | 43/126 [00:53<01:39,  1.20s/it][A
- 35%|███▍      | 44/126 [00:55<01:38,  1.20s/it][A
- 36%|███▌      | 45/126 [00:56<01:37,  1.20s/it][A
- 37%|███▋      | 46/126 [00:57<01:36,  1.20s/it][A
- 37%|███▋      | 47/126 [00:58<01:34,  1.20s/it][A
- 38%|███▊      | 48/126 [00:59<01:35,  1.23s/it][A
- 39%|███▉      | 49/126 [01:01<01:34,  1.22s/it][A
- 40%|███▉      | 50/126 [01:02<01:32,  1.21s/it][A
- 40%|████      | 51/126 [01:03<01:30,  1.21s/it][A
- 41%|████▏     | 52/126 [01:04<01:29,  1.21s/it][A
- 42%|████▏     | 53/126 [01:05<01:27,  1.20s/it][A
- 43%|████▎     | 54/126 [01:07<01:26,  1.20s/it][A
- 44%|████▎     | 55/126 [01:08<01:25,  1.20s/it][A
- 44%|████▍     | 56/126 [01:09<01:24,  1.20s/it][A
- 45%|████▌     | 57/126 [01:10<01:23,  1.20s/it][A
- 46%|████▌     | 58/126 [01:11<01:21,  1.20s/it][A
- 47%|████▋     | 59/126 [01:13<01:20,  1.20s/it][A
- 48%|████▊     | 60/126 [01:14<01:19,  1.20s/it][A
- 48%|████▊     | 61/126 [01:15<01:18,  1.20s/it][A
- 49%|████▉     | 62/126 [01:16<01:16,  1.20s/it][A
- 50%|█████     | 63/126 [01:17<01:15,  1.20s/it][A
- 51%|█████     | 64/126 [01:19<01:14,  1.20s/it][A
- 52%|█████▏    | 65/126 [01:20<01:13,  1.20s/it][A
- 52%|█████▏    | 66/126 [01:21<01:11,  1.20s/it][A
- 53%|█████▎    | 67/126 [01:22<01:10,  1.20s/it][A
- 54%|█████▍    | 68/126 [01:23<01:09,  1.20s/it][A
- 55%|█████▍    | 69/126 [01:25<01:08,  1.20s/it][A
- 56%|█████▌    | 70/126 [01:26<01:07,  1.20s/it][A
- 56%|█████▋    | 71/126 [01:27<01:05,  1.20s/it][A
- 57%|█████▋    | 72/126 [01:28<01:04,  1.20s/it][A
- 58%|█████▊    | 73/126 [01:29<01:03,  1.20s/it][A
- 59%|█████▊    | 74/126 [01:31<01:02,  1.20s/it][A
- 60%|█████▉    | 75/126 [01:32<01:01,  1.20s/it][A
- 60%|██████    | 76/126 [01:33<00:59,  1.20s/it][A
- 61%|██████    | 77/126 [01:34<00:58,  1.20s/it][A
- 62%|██████▏   | 78/126 [01:35<00:57,  1.20s/it][A
- 63%|██████▎   | 79/126 [01:37<00:56,  1.21s/it][A
- 63%|██████▎   | 80/126 [01:38<00:55,  1.21s/it][A
- 64%|██████▍   | 81/126 [01:39<00:54,  1.20s/it][A
- 65%|██████▌   | 82/126 [01:40<00:52,  1.20s/it][A
- 66%|██████▌   | 83/126 [01:41<00:51,  1.20s/it][A
- 67%|██████▋   | 84/126 [01:43<00:50,  1.20s/it][A
- 67%|██████▋   | 85/126 [01:44<00:49,  1.20s/it][A
- 68%|██████▊   | 86/126 [01:45<00:48,  1.21s/it][A
- 69%|██████▉   | 87/126 [01:46<00:46,  1.20s/it][A
- 70%|██████▉   | 88/126 [01:47<00:45,  1.20s/it][A
- 71%|███████   | 89/126 [01:49<00:44,  1.20s/it][A
- 71%|███████▏  | 90/126 [01:50<00:43,  1.20s/it][A
- 72%|███████▏  | 91/126 [01:51<00:41,  1.20s/it][A
- 73%|███████▎  | 92/126 [01:52<00:40,  1.20s/it][A
- 74%|███████▍  | 93/126 [01:53<00:39,  1.19s/it][A
- 75%|███████▍  | 94/126 [01:55<00:38,  1.19s/it][A
- 75%|███████▌  | 95/126 [01:56<00:37,  1.20s/it][A
- 76%|███████▌  | 96/126 [01:57<00:35,  1.20s/it][A
- 77%|███████▋  | 97/126 [01:58<00:34,  1.20s/it][A
- 78%|███████▊  | 98/126 [01:59<00:33,  1.20s/it][A
- 79%|███████▊  | 99/126 [02:01<00:32,  1.20s/it][A
- 79%|███████▉  | 100/126 [02:02<00:31,  1.20s/it][A
- 80%|████████  | 101/126 [02:03<00:29,  1.20s/it][A
- 81%|████████  | 102/126 [02:04<00:28,  1.20s/it][A
- 82%|████████▏ | 103/126 [02:05<00:27,  1.20s/it][A
- 83%|████████▎ | 104/126 [02:07<00:26,  1.20s/it][A
- 83%|████████▎ | 105/126 [02:08<00:25,  1.20s/it][A
- 84%|████████▍ | 106/126 [02:09<00:23,  1.20s/it][A
- 85%|████████▍ | 107/126 [02:10<00:22,  1.20s/it][A
- 86%|████████▌ | 108/126 [02:11<00:21,  1.20s/it][A
- 87%|████████▋ | 109/126 [02:13<00:20,  1.20s/it][A
- 87%|████████▋ | 110/126 [02:14<00:19,  1.20s/it][A
- 88%|████████▊ | 111/126 [02:15<00:18,  1.20s/it][A
- 89%|████████▉ | 112/126 [02:16<00:16,  1.20s/it][A
- 90%|████████▉ | 113/126 [02:17<00:15,  1.20s/it][A
- 90%|█████████ | 114/126 [02:19<00:14,  1.20s/it][A
- 91%|█████████▏| 115/126 [02:20<00:13,  1.21s/it][A
- 92%|█████████▏| 116/126 [02:21<00:12,  1.21s/it][A
- 93%|█████████▎| 117/126 [02:22<00:10,  1.21s/it][A
- 94%|█████████▎| 118/126 [02:23<00:09,  1.20s/it][A
- 94%|█████████▍| 119/126 [02:25<00:08,  1.20s/it][A
- 95%|█████████▌| 120/126 [02:26<00:07,  1.20s/it][A
- 96%|█████████▌| 121/126 [02:27<00:06,  1.20s/it][A
- 97%|█████████▋| 122/126 [02:28<00:04,  1.20s/it][A
- 98%|█████████▊| 123/126 [02:29<00:03,  1.20s/it][A
- 98%|█████████▊| 124/126 [02:31<00:02,  1.20s/it][A 98%|█████████▊| 124/126 [02:31<00:02,  1.22s/it]
-Traceback (most recent call last):
-  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 217, in <module>
-    for batch in tqdm(eval_dataloader):
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/tqdm/std.py", line 1178, in __iter__
-    for obj in iterable:
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/accelerate/data_loader.py", line 394, in __iter__
-    next_batch = next(dataloader_iter)
-                 ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 633, in __next__
-    data = self._next_data()
-           ^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 677, in _next_data
-    data = self._dataset_fetcher.fetch(index)  # may raise StopIteration
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/torch/utils/data/_utils/fetch.py", line 54, in fetch
-    return self.collate_fn(data)
-           ^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/data/data_collator.py", line 600, in __call__
-    decoder_input_ids = self.model.prepare_decoder_input_ids_from_labels(labels=features["labels"])
-                        ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/marian/modeling_marian.py", line 1527, in prepare_decoder_input_ids_from_labels
-    return shift_tokens_right(labels, self.config.pad_token_id, self.config.decoder_start_token_id)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/marian/modeling_marian.py", line 66, in shift_tokens_right
-    shifted_input_ids[:, 0] = decoder_start_token_id
-    ~~~~~~~~~~~~~~~~~^^^^^^
-IndexError: index 0 is out of bounds for dimension 1 with size 0
- 33%|███▎      | 912/2736 [03:44<07:29,  4.06it/s]
diff --git a/myerrors_1600.out b/myerrors_1600.out
new file mode 100644
index 0000000000000000000000000000000000000000..f379eca7f6f68455bda5040f70e6ff68d7078d37
--- /dev/null
+++ b/myerrors_1600.out
@@ -0,0 +1,49 @@
+You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
+  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:31,  2.29s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.15s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.63s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.90s/it] 38%|███▊      | 6/16 [00:22<00:40,  4.05s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.15s/it] 50%|█████     | 8/16 [00:30<00:33,  4.22s/it] 56%|█████▋    | 9/16 [00:35<00:29,  4.26s/it] 62%|██████▎   | 10/16 [00:39<00:25,  4.30s/it] 69%|██████▉   | 11/16 [00:44<00:21,  4.33s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.34s/it] 81%|████████▏ | 13/16 [00:52<00:13,  4.34s/it] 88%|████████▊ | 14/16 [00:57<00:08,  4.34s/it] 94%|█████████▍| 15/16 [01:01<00:04,  4.35s/it]100%|██████████| 16/16 [01:04<00:00,  3.96s/it]100%|██████████| 16/16 [01:05<00:00,  4.07s/it]
+  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:41,  4.22it/s]  0%|          | 3/684 [00:00<01:18,  8.68it/s]  1%|          | 5/684 [00:00<01:03, 10.68it/s]  1%|          | 7/684 [00:00<00:57, 11.81it/s]  1%|▏         | 9/684 [00:00<00:53, 12.61it/s]  2%|▏         | 11/684 [00:00<00:51, 12.99it/s]  2%|▏         | 13/684 [00:01<00:51, 13.13it/s]  2%|▏         | 15/684 [00:01<00:50, 13.27it/s]  2%|▏         | 17/684 [00:01<00:49, 13.56it/s]  3%|▎         | 19/684 [00:01<00:49, 13.54it/s]  3%|▎         | 21/684 [00:01<00:49, 13.51it/s]  3%|▎         | 23/684 [00:01<00:49, 13.48it/s]  4%|▎         | 25/684 [00:01<00:48, 13.51it/s]  4%|▍         | 27/684 [00:02<00:48, 13.49it/s]  4%|▍         | 29/684 [00:02<00:48, 13.48it/s]  5%|▍         | 31/684 [00:02<00:48, 13.54it/s]  5%|▍         | 33/684 [00:02<00:47, 13.66it/s]  5%|▌         | 35/684 [00:02<00:47, 13.62it/s]  5%|▌         | 37/684 [00:02<00:47, 13.65it/s]  6%|▌         | 39/684 [00:03<00:47, 13.70it/s]  6%|▌         | 41/684 [00:03<00:46, 13.77it/s]  6%|▋         | 43/684 [00:03<00:46, 13.76it/s]  7%|▋         | 45/684 [00:03<00:46, 13.65it/s]  7%|▋         | 47/684 [00:03<00:46, 13.70it/s]  7%|▋         | 49/684 [00:03<00:46, 13.68it/s]  7%|▋         | 51/684 [00:03<00:45, 13.87it/s]  8%|▊         | 53/684 [00:04<00:45, 13.95it/s]  8%|▊         | 55/684 [00:04<00:45, 13.88it/s]  8%|▊         | 57/684 [00:04<00:44, 14.01it/s]  9%|▊         | 59/684 [00:04<00:44, 13.95it/s]  9%|▉         | 61/684 [00:04<00:44, 13.89it/s]  9%|▉         | 63/684 [00:04<00:45, 13.78it/s] 10%|▉         | 65/684 [00:04<00:45, 13.66it/s] 10%|▉         | 67/684 [00:05<00:45, 13.65it/s] 10%|█         | 69/684 [00:05<00:45, 13.60it/s] 10%|█         | 71/684 [00:05<00:45, 13.56it/s] 11%|█         | 73/684 [00:05<00:45, 13.52it/s] 11%|█         | 75/684 [00:05<00:44, 13.54it/s] 11%|█▏        | 77/684 [00:05<00:43, 13.82it/s] 12%|█▏        | 79/684 [00:05<00:43, 13.92it/s] 
12%|█▏        | 81/684 [00:06<00:43, 13.92it/s] 12%|█▏        | 83/684 [00:06<00:42, 13.99it/s] 12%|█▏        | 85/684 [00:06<00:42, 13.98it/s] 13%|█▎        | 87/684 [00:06<00:42, 13.99it/s] 13%|█▎        | 89/684 [00:06<00:42, 13.87it/s] 13%|█▎        | 91/684 [00:06<00:43, 13.75it/s] 14%|█▎        | 93/684 [00:06<00:43, 13.65it/s] 14%|█▍        | 95/684 [00:07<00:43, 13.58it/s] 14%|█▍        | 97/684 [00:07<00:42, 13.75it/s] 14%|█▍        | 99/684 [00:07<00:42, 13.71it/s] 15%|█▍        | 101/684 [00:07<00:42, 13.71it/s] 15%|█▌        | 103/684 [00:07<00:42, 13.59it/s] 15%|█▌        | 105/684 [00:07<00:42, 13.56it/s] 16%|█▌        | 107/684 [00:07<00:42, 13.58it/s] 16%|█▌        | 109/684 [00:08<00:42, 13.62it/s] 16%|█▌        | 111/684 [00:08<00:42, 13.60it/s] 17%|█▋        | 113/684 [00:08<00:41, 13.65it/s] 17%|█▋        | 115/684 [00:08<00:41, 13.79it/s] 17%|█▋        | 117/684 [00:08<00:41, 13.80it/s] 17%|█▋        | 119/684 [00:08<00:40, 13.93it/s] 18%|█▊        | 121/684 [00:08<00:40, 13.79it/s] 18%|█▊        | 123/684 [00:09<00:40, 13.73it/s] 18%|█▊        | 125/684 [00:09<00:40, 13.79it/s] 19%|█▊        | 127/684 [00:09<00:39, 13.93it/s] 19%|█▉        | 129/684 [00:09<00:40, 13.77it/s] 19%|█▉        | 131/684 [00:09<00:40, 13.67it/s] 19%|█▉        | 133/684 [00:09<00:40, 13.67it/s] 20%|█▉        | 135/684 [00:09<00:40, 13.64it/s] 20%|██        | 137/684 [00:10<00:40, 13.58it/s] 20%|██        | 139/684 [00:10<00:40, 13.53it/s] 21%|██        | 141/684 [00:10<00:40, 13.51it/s] 21%|██        | 143/684 [00:10<00:40, 13.51it/s] 21%|██        | 145/684 [00:10<00:39, 13.66it/s] 21%|██▏       | 147/684 [00:10<00:38, 13.81it/s] 22%|██▏       | 149/684 [00:11<00:38, 13.74it/s] 22%|██▏       | 151/684 [00:11<00:39, 13.66it/s] 22%|██▏       | 153/684 [00:11<00:38, 13.63it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.60it/s] 23%|██▎       | 157/684 [00:11<00:38, 13.77it/s] 23%|██▎       | 159/684 [00:11<00:37, 13.83it/s] 24%|██▎   
    | 161/684 [00:11<00:38, 13.75it/s] 24%|██▍       | 163/684 [00:12<00:37, 13.93it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.97it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.94it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.79it/s] 25%|██▌       | 171/684 [00:12<00:37, 13.76it/s] 25%|██▌       | 173/684 [00:12<00:36, 13.89it/s] 26%|██▌       | 175/684 [00:12<00:37, 13.74it/s] 26%|██▌       | 177/684 [00:13<00:36, 13.89it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.93it/s] 26%|██▋       | 181/684 [00:13<00:35, 14.04it/s] 27%|██▋       | 183/684 [00:13<00:35, 14.06it/s] 27%|██▋       | 185/684 [00:13<00:35, 14.05it/s] 27%|██▋       | 187/684 [00:13<00:35, 13.99it/s] 28%|██▊       | 189/684 [00:13<00:35, 14.03it/s] 28%|██▊       | 191/684 [00:14<00:35, 13.87it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.79it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.81it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.81it/s] 29%|██▉       | 199/684 [00:14<00:35, 13.80it/s] 29%|██▉       | 201/684 [00:14<00:34, 13.81it/s] 30%|██▉       | 203/684 [00:14<00:34, 13.77it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.79it/s] 30%|███       | 207/684 [00:15<00:34, 13.80it/s] 31%|███       | 209/684 [00:15<00:34, 13.89it/s] 31%|███       | 211/684 [00:15<00:34, 13.88it/s] 31%|███       | 213/684 [00:15<00:33, 13.87it/s] 31%|███▏      | 215/684 [00:15<00:33, 13.89it/s] 32%|███▏      | 217/684 [00:15<00:33, 13.93it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.97it/s] 32%|███▏      | 221/684 [00:16<00:32, 14.03it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.96it/s] 33%|███▎      | 225/684 [00:16<00:32, 14.06it/s] 33%|███▎      | 227/684 [00:16<00:32, 14.11it/s] 33%|███▎      | 229/684 [00:19<03:04,  2.47it/s] 34%|███▍      | 231/684 [00:19<02:17,  3.28it/s] 34%|███▍      | 233/684 [00:19<01:45,  4.26it/s] 34%|███▍      | 235/684 [00:19<01:23,  5.39it/s] 35%|███▍      | 237/684 [00:19<01:07,  6.59it/s] 35%|███▍      | 239/684 [00:19<00:58,  7.57it/s] 35%|███▌  
    | 241/684 [00:19<00:50,  8.74it/s] 36%|███▌      | 243/684 [00:20<00:46,  9.56it/s] 36%|███▌      | 245/684 [00:20<00:42, 10.45it/s] 36%|███▌      | 247/684 [00:20<00:38, 11.31it/s] 36%|███▋      | 249/684 [00:20<00:37, 11.63it/s] 37%|███▋      | 251/684 [00:20<00:35, 12.20it/s] 37%|███▋      | 253/684 [00:20<00:35, 12.28it/s] 37%|███▋      | 255/684 [00:20<00:34, 12.52it/s] 38%|███▊      | 257/684 [00:21<00:33, 12.72it/s] 38%|███▊      | 259/684 [00:21<00:33, 12.64it/s] 38%|███▊      | 261/684 [00:21<00:33, 12.65it/s] 38%|███▊      | 263/684 [00:21<00:33, 12.59it/s] 39%|███▊      | 265/684 [00:21<00:32, 12.74it/s] 39%|███▉      | 267/684 [00:21<00:32, 12.71it/s] 39%|███▉      | 269/684 [00:22<00:32, 12.64it/s] 40%|███▉      | 271/684 [00:22<00:31, 13.05it/s] 40%|███▉      | 273/684 [00:22<00:30, 13.42it/s] 40%|████      | 275/684 [00:22<00:31, 13.03it/s] 40%|████      | 277/684 [00:22<00:31, 13.01it/s] 41%|████      | 279/684 [00:22<00:31, 12.82it/s] 41%|████      | 281/684 [00:22<00:31, 12.74it/s] 41%|████▏     | 283/684 [00:23<00:31, 12.81it/s] 42%|████▏     | 285/684 [00:23<00:30, 12.90it/s] 42%|████▏     | 287/684 [00:23<00:30, 13.00it/s] 42%|████▏     | 289/684 [00:23<00:29, 13.30it/s] 43%|████▎     | 291/684 [00:23<00:30, 13.01it/s] 43%|████▎     | 293/684 [00:23<00:30, 12.80it/s] 43%|████▎     | 295/684 [00:24<00:29, 13.07it/s] 43%|████▎     | 297/684 [00:24<00:30, 12.79it/s] 44%|████▎     | 299/684 [00:24<00:29, 13.12it/s] 44%|████▍     | 301/684 [00:24<00:30, 12.73it/s] 44%|████▍     | 303/684 [00:24<00:29, 12.73it/s] 45%|████▍     | 305/684 [00:24<00:29, 12.93it/s] 45%|████▍     | 307/684 [00:25<00:29, 12.83it/s] 45%|████▌     | 309/684 [00:25<00:28, 13.19it/s] 45%|████▌     | 311/684 [00:25<00:28, 13.02it/s] 46%|████▌     | 313/684 [00:25<00:27, 13.40it/s] 46%|████▌     | 315/684 [00:25<00:27, 13.38it/s] 46%|████▋     | 317/684 [00:25<00:27, 13.35it/s] 47%|████▋     | 319/684 [00:25<00:27, 13.48it/s] 47%|████▋ 
    | 321/684 [00:26<00:26, 13.64it/s] 47%|████▋     | 323/684 [00:26<00:26, 13.77it/s] 48%|████▊     | 325/684 [00:26<00:25, 13.83it/s] 48%|████▊     | 327/684 [00:26<00:25, 13.90it/s] 48%|████▊     | 329/684 [00:26<00:25, 13.96it/s] 48%|████▊     | 331/684 [00:26<00:25, 13.98it/s] 49%|████▊     | 333/684 [00:26<00:25, 14.03it/s] 49%|████▉     | 335/684 [00:27<00:24, 14.00it/s] 49%|████▉     | 337/684 [00:27<00:24, 14.06it/s] 50%|████▉     | 339/684 [00:27<00:24, 14.06it/s] 50%|████▉     | 341/684 [00:27<00:24, 14.01it/s] 50%|█████     | 343/684 [00:27<00:24, 14.00it/s] 50%|█████     | 345/684 [00:27<00:24, 14.01it/s] 51%|█████     | 347/684 [00:27<00:24, 13.99it/s] 51%|█████     | 349/684 [00:28<00:23, 13.99it/s] 51%|█████▏    | 351/684 [00:28<00:23, 14.02it/s] 52%|█████▏    | 353/684 [00:28<00:23, 14.02it/s] 52%|█████▏    | 355/684 [00:28<00:23, 14.02it/s] 52%|█████▏    | 357/684 [00:28<00:23, 14.02it/s] 52%|█████▏    | 359/684 [00:28<00:23, 14.02it/s] 53%|█████▎    | 361/684 [00:28<00:23, 14.02it/s] 53%|█████▎    | 363/684 [00:29<00:22, 14.00it/s] 53%|█████▎    | 365/684 [00:29<00:22, 14.00it/s] 54%|█████▎    | 367/684 [00:29<00:22, 14.00it/s] 54%|█████▍    | 369/684 [00:29<00:22, 14.01it/s] 54%|█████▍    | 371/684 [00:29<00:22, 14.03it/s] 55%|█████▍    | 373/684 [00:29<00:22, 14.01it/s] 55%|█████▍    | 375/684 [00:29<00:22, 14.02it/s] 55%|█████▌    | 377/684 [00:30<00:21, 14.01it/s] 55%|█████▌    | 379/684 [00:30<00:21, 14.05it/s] 56%|█████▌    | 381/684 [00:30<00:21, 14.04it/s] 56%|█████▌    | 383/684 [00:30<00:21, 14.02it/s] 56%|█████▋    | 385/684 [00:30<00:21, 14.00it/s] 57%|█████▋    | 387/684 [00:30<00:21, 13.98it/s] 57%|█████▋    | 389/684 [00:30<00:21, 13.99it/s] 57%|█████▋    | 391/684 [00:31<00:20, 14.02it/s] 57%|█████▋    | 393/684 [00:31<00:20, 14.04it/s] 58%|█████▊    | 395/684 [00:31<00:20, 14.01it/s] 58%|█████▊    | 397/684 [00:31<00:20, 13.99it/s] 58%|█████▊    | 399/684 [00:31<00:20, 14.00it/s] 
59%|█████▊    | 401/684 [00:31<00:20, 14.01it/s] 59%|█████▉    | 403/684 [00:31<00:20, 13.99it/s] 59%|█████▉    | 405/684 [00:32<00:19, 14.00it/s] 60%|█████▉    | 407/684 [00:32<00:19, 14.01it/s] 60%|█████▉    | 409/684 [00:32<00:19, 14.02it/s] 60%|██████    | 411/684 [00:32<00:19, 14.01it/s] 60%|██████    | 413/684 [00:32<00:19, 14.01it/s] 61%|██████    | 415/684 [00:32<00:19, 14.03it/s] 61%|██████    | 417/684 [00:32<00:19, 14.02it/s] 61%|██████▏   | 419/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 421/684 [00:33<00:18, 14.02it/s] 62%|██████▏   | 423/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 425/684 [00:33<00:18, 14.04it/s] 62%|██████▏   | 427/684 [00:33<00:18, 14.01it/s] 63%|██████▎   | 429/684 [00:33<00:18, 14.02it/s] 63%|██████▎   | 431/684 [00:33<00:18, 14.02it/s] 63%|██████▎   | 433/684 [00:34<00:17, 14.07it/s] 64%|██████▎   | 435/684 [00:34<00:17, 14.01it/s] 64%|██████▍   | 437/684 [00:34<00:17, 13.98it/s] 64%|██████▍   | 439/684 [00:34<00:17, 14.00it/s] 64%|██████▍   | 441/684 [00:34<00:17, 14.02it/s] 65%|██████▍   | 443/684 [00:34<00:17, 14.03it/s] 65%|██████▌   | 445/684 [00:34<00:16, 14.07it/s] 65%|██████▌   | 447/684 [00:35<00:16, 14.04it/s] 66%|██████▌   | 449/684 [00:35<00:16, 14.02it/s] 66%|██████▌   | 451/684 [00:35<00:16, 13.99it/s] 66%|██████▌   | 453/684 [00:35<00:16, 13.99it/s] 67%|██████▋   | 455/684 [00:35<00:16, 14.01it/s] 67%|██████▋   | 457/684 [00:37<01:33,  2.44it/s] 67%|██████▋   | 459/684 [00:38<01:09,  3.24it/s] 67%|██████▋   | 461/684 [00:38<00:52,  4.21it/s] 68%|██████▊   | 463/684 [00:38<00:41,  5.33it/s] 68%|██████▊   | 465/684 [00:38<00:33,  6.50it/s] 68%|██████▊   | 467/684 [00:38<00:28,  7.65it/s] 69%|██████▊   | 469/684 [00:38<00:24,  8.80it/s] 69%|██████▉   | 471/684 [00:39<00:21,  9.78it/s] 69%|██████▉   | 473/684 [00:39<00:19, 10.59it/s] 69%|██████▉   | 475/684 [00:39<00:18, 11.38it/s] 70%|██████▉   | 477/684 [00:39<00:17, 12.10it/s] 70%|███████   | 479/684 [00:39<00:16, 12.25it/s] 
70%|███████   | 481/684 [00:39<00:16, 12.55it/s] 71%|███████   | 483/684 [00:39<00:15, 12.84it/s] 71%|███████   | 485/684 [00:40<00:15, 12.77it/s] 71%|███████   | 487/684 [00:40<00:15, 12.87it/s] 71%|███████▏  | 489/684 [00:40<00:15, 12.90it/s] 72%|███████▏  | 491/684 [00:40<00:14, 12.87it/s] 72%|███████▏  | 493/684 [00:40<00:14, 12.98it/s] 72%|███████▏  | 495/684 [00:40<00:14, 12.86it/s] 73%|███████▎  | 497/684 [00:40<00:14, 13.05it/s] 73%|███████▎  | 499/684 [00:41<00:14, 12.87it/s]                                                  73%|███████▎  | 500/684 [00:41<00:14, 12.87it/s] 73%|███████▎  | 501/684 [00:41<00:14, 13.07it/s] 74%|███████▎  | 503/684 [00:41<00:14, 12.80it/s] 74%|███████▍  | 505/684 [00:41<00:13, 13.08it/s] 74%|███████▍  | 507/684 [00:41<00:13, 12.69it/s] 74%|███████▍  | 509/684 [00:41<00:13, 13.06it/s] 75%|███████▍  | 511/684 [00:42<00:13, 12.87it/s] 75%|███████▌  | 513/684 [00:42<00:13, 13.14it/s] 75%|███████▌  | 515/684 [00:42<00:13, 12.82it/s] 76%|███████▌  | 517/684 [00:42<00:12, 13.10it/s] 76%|███████▌  | 519/684 [00:42<00:12, 12.94it/s] 76%|███████▌  | 521/684 [00:42<00:12, 12.78it/s] 76%|███████▋  | 523/684 [00:43<00:12, 13.07it/s] 77%|███████▋  | 525/684 [00:43<00:12, 12.78it/s] 77%|███████▋  | 527/684 [00:43<00:12, 12.78it/s] 77%|███████▋  | 529/684 [00:43<00:12, 12.74it/s] 78%|███████▊  | 531/684 [00:43<00:12, 12.63it/s] 78%|███████▊  | 533/684 [00:43<00:11, 12.93it/s] 78%|███████▊  | 535/684 [00:43<00:11, 12.69it/s] 79%|███████▊  | 537/684 [00:44<00:11, 13.06it/s] 79%|███████▉  | 539/684 [00:44<00:11, 12.83it/s] 79%|███████▉  | 541/684 [00:44<00:10, 13.13it/s] 79%|███████▉  | 543/684 [00:44<00:10, 13.20it/s] 80%|███████▉  | 545/684 [00:44<00:10, 13.21it/s] 80%|███████▉  | 547/684 [00:44<00:10, 13.32it/s] 80%|████████  | 549/684 [00:44<00:09, 13.52it/s] 81%|████████  | 551/684 [00:45<00:09, 13.69it/s] 81%|████████  | 553/684 [00:45<00:09, 13.76it/s] 81%|████████  | 555/684 [00:45<00:09, 13.87it/s]
 81%|████████▏ | 557/684 [00:45<00:09, 13.92it/s] 82%|████████▏ | 559/684 [00:45<00:08, 13.95it/s] 82%|████████▏ | 561/684 [00:45<00:08, 13.97it/s] 82%|████████▏ | 563/684 [00:45<00:08, 13.99it/s] 83%|████████▎ | 565/684 [00:46<00:08, 13.97it/s] 83%|████████▎ | 567/684 [00:46<00:08, 14.02it/s] 83%|████████▎ | 569/684 [00:46<00:08, 14.01it/s] 83%|████████▎ | 571/684 [00:46<00:08, 14.01it/s] 84%|████████▍ | 573/684 [00:46<00:07, 14.04it/s] 84%|████████▍ | 575/684 [00:46<00:07, 14.05it/s] 84%|████████▍ | 577/684 [00:46<00:07, 13.99it/s] 85%|████████▍ | 579/684 [00:47<00:07, 14.00it/s] 85%|████████▍ | 581/684 [00:47<00:07, 14.02it/s] 85%|████████▌ | 583/684 [00:47<00:07, 13.99it/s] 86%|████████▌ | 585/684 [00:47<00:07, 14.02it/s] 86%|████████▌ | 587/684 [00:47<00:06, 14.04it/s] 86%|████████▌ | 589/684 [00:47<00:06, 14.02it/s] 86%|████████▋ | 591/684 [00:47<00:06, 14.02it/s] 87%|████████▋ | 593/684 [00:48<00:06, 13.99it/s] 87%|████████▋ | 595/684 [00:48<00:06, 14.04it/s] 87%|████████▋ | 597/684 [00:48<00:06, 14.02it/s] 88%|████████▊ | 599/684 [00:48<00:06, 14.00it/s] 88%|████████▊ | 601/684 [00:48<00:05, 14.04it/s] 88%|████████▊ | 603/684 [00:48<00:05, 14.01it/s] 88%|████████▊ | 605/684 [00:48<00:05, 14.00it/s] 89%|████████▊ | 607/684 [00:49<00:05, 14.03it/s] 89%|████████▉ | 609/684 [00:49<00:05, 14.03it/s] 89%|████████▉ | 611/684 [00:49<00:05, 14.03it/s] 90%|████████▉ | 613/684 [00:49<00:05, 14.02it/s] 90%|████████▉ | 615/684 [00:49<00:04, 14.01it/s] 90%|█████████ | 617/684 [00:49<00:04, 14.00it/s] 90%|█████████ | 619/684 [00:49<00:04, 13.99it/s] 91%|█████████ | 621/684 [00:50<00:04, 14.00it/s] 91%|█████████ | 623/684 [00:50<00:04, 14.02it/s] 91%|█████████▏| 625/684 [00:50<00:04, 13.97it/s] 92%|█████████▏| 627/684 [00:50<00:04, 13.95it/s] 92%|█████████▏| 629/684 [00:50<00:03, 14.00it/s] 92%|█████████▏| 631/684 [00:50<00:03, 13.96it/s] 93%|█████████▎| 633/684 [00:50<00:03, 14.02it/s] 93%|█████████▎| 635/684 [00:51<00:03, 14.02it/s]
 93%|█████████▎| 637/684 [00:51<00:03, 14.02it/s] 93%|█████████▎| 639/684 [00:51<00:03, 14.04it/s] 94%|█████████▎| 641/684 [00:51<00:03, 14.02it/s] 94%|█████████▍| 643/684 [00:51<00:02, 14.02it/s] 94%|█████████▍| 645/684 [00:51<00:02, 14.03it/s] 95%|█████████▍| 647/684 [00:51<00:02, 14.02it/s] 95%|█████████▍| 649/684 [00:52<00:02, 14.02it/s] 95%|█████████▌| 651/684 [00:52<00:02, 14.02it/s] 95%|█████████▌| 653/684 [00:52<00:02, 14.02it/s] 96%|█████████▌| 655/684 [00:52<00:02, 14.04it/s] 96%|█████████▌| 657/684 [00:52<00:01, 14.06it/s] 96%|█████████▋| 659/684 [00:52<00:01, 14.05it/s] 97%|█████████▋| 661/684 [00:52<00:01, 14.03it/s] 97%|█████████▋| 663/684 [00:53<00:01, 14.03it/s] 97%|█████████▋| 665/684 [00:53<00:01, 14.05it/s] 98%|█████████▊| 667/684 [00:53<00:01, 14.02it/s] 98%|█████████▊| 669/684 [00:53<00:01, 14.01it/s] 98%|█████████▊| 671/684 [00:53<00:00, 14.02it/s] 98%|█████████▊| 673/684 [00:53<00:00, 14.01it/s] 99%|█████████▊| 675/684 [00:53<00:00, 14.00it/s] 99%|█████████▉| 677/684 [00:54<00:00, 14.03it/s] 99%|█████████▉| 679/684 [00:54<00:00, 14.01it/s]100%|█████████▉| 681/684 [00:54<00:00, 14.03it/s]100%|█████████▉| 683/684 [00:54<00:00, 14.01it/s]                                                 100%|██████████| 684/684 [00:56<00:00, 14.01it/s]100%|██████████| 684/684 [00:56<00:00, 12.04it/s]
+  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:30,  2.21s/it] 19%|█▉        | 3/16 [00:08<00:40,  3.14s/it] 25%|██▌       | 4/16 [00:13<00:43,  3.62s/it] 31%|███▏      | 5/16 [00:17<00:42,  3.90s/it] 38%|███▊      | 6/16 [00:22<00:40,  4.07s/it] 44%|████▍     | 7/16 [00:26<00:37,  4.19s/it] 50%|█████     | 8/16 [00:30<00:34,  4.26s/it] 56%|█████▋    | 9/16 [00:35<00:30,  4.31s/it] 62%|██████▎   | 10/16 [00:39<00:26,  4.34s/it] 69%|██████▉   | 11/16 [00:44<00:21,  4.35s/it] 75%|███████▌  | 12/16 [00:48<00:17,  4.36s/it] 81%|████████▏ | 13/16 [00:52<00:13,  4.36s/it] 88%|████████▊ | 14/16 [00:57<00:08,  4.37s/it] 94%|█████████▍| 15/16 [01:01<00:04,  4.37s/it]100%|██████████| 16/16 [01:04<00:00,  3.98s/it]100%|██████████| 16/16 [01:05<00:00,  4.09s/it]
+/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning
+  warnings.warn(
+/mnt/storage/aatherton/hf_eng_fra_trans is already a clone of https://huggingface.co/aatherton2024/hf_eng_fra_trans. Make sure you pull the latest changes with `repo.git_pull()`.
+Traceback (most recent call last):
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_errors.py", line 261, in hf_raise_for_status
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/requests/models.py", line 1021, in raise_for_status
+    raise HTTPError(http_error_msg, response=self)
+requests.exceptions.HTTPError: 404 Client Error: Not Found for url: https://huggingface.co/aatherton2024/hf_synth_trans/resolve/main/config.json
+
+The above exception was the direct cause of the following exception:
+
+Traceback (most recent call last):
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 428, in cached_file
+    resolved_file = hf_hub_download(
+                    ^^^^^^^^^^^^^^^^
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1230, in hf_hub_download
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/file_download.py", line 1606, in get_hf_file_metadata
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/huggingface_hub-0.17.1-py3.8.egg/huggingface_hub/utils/_errors.py", line 271, in hf_raise_for_status
+huggingface_hub.utils._errors.EntryNotFoundError: 404 Client Error. (Request ID: Root=1-6508f53c-403d6b2e4c215eb0090d4b33;cdf95f5b-24d2-49b8-9434-cfaa697f931b)
+
+Entry Not Found for url: https://huggingface.co/aatherton2024/hf_synth_trans/resolve/main/config.json.
+
+The above exception was the direct cause of the following exception:
+
+Traceback (most recent call last):
+  File "/mnt/storage/aatherton/hf_synth_trans/synth_translation.py", line 268, in <module>
+    translator = pipeline("translation", model=model_checkpoint)
+                 ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/pipelines/__init__.py", line 724, in pipeline
+    config = AutoConfig.from_pretrained(model, _from_pipeline=task, **hub_kwargs, **model_kwargs)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/models/auto/configuration_auto.py", line 1007, in from_pretrained
+    config_dict, unused_kwargs = PretrainedConfig.get_config_dict(pretrained_model_name_or_path, **kwargs)
+                                 ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/configuration_utils.py", line 620, in get_config_dict
+    config_dict, kwargs = cls._get_config_dict(pretrained_model_name_or_path, **kwargs)
+                          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/configuration_utils.py", line 675, in _get_config_dict
+    resolved_config_file = cached_file(
+                           ^^^^^^^^^^^^
+  File "/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/utils/hub.py", line 479, in cached_file
+    raise EnvironmentError(
+OSError: aatherton2024/hf_synth_trans does not appear to have a file named config.json. Checkout 'https://huggingface.co/aatherton2024/hf_synth_trans/main' for available files.
diff --git a/myerrors_1601.out b/myerrors_1601.out
new file mode 100644
index 0000000000000000000000000000000000000000..e6b212d430b00355805f9df87ae54b9e85efa500
--- /dev/null
+++ b/myerrors_1601.out
@@ -0,0 +1,16 @@
+You're using a GPT2TokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.
+  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:05<00:35,  2.54s/it] 19%|█▉        | 3/16 [00:09<00:43,  3.37s/it] 25%|██▌       | 4/16 [00:14<00:45,  3.79s/it] 31%|███▏      | 5/16 [00:18<00:44,  4.03s/it] 38%|███▊      | 6/16 [00:23<00:42,  4.22s/it] 44%|████▍     | 7/16 [00:27<00:38,  4.31s/it] 50%|█████     | 8/16 [00:32<00:34,  4.36s/it] 56%|█████▋    | 9/16 [00:36<00:30,  4.41s/it] 62%|██████▎   | 10/16 [00:41<00:26,  4.46s/it] 69%|██████▉   | 11/16 [00:45<00:22,  4.49s/it] 75%|███████▌  | 12/16 [00:50<00:17,  4.49s/it] 81%|████████▏ | 13/16 [00:54<00:13,  4.49s/it] 88%|████████▊ | 14/16 [00:59<00:08,  4.49s/it] 94%|█████████▍| 15/16 [01:03<00:04,  4.49s/it]100%|██████████| 16/16 [01:06<00:00,  4.09s/it]100%|██████████| 16/16 [01:07<00:00,  4.23s/it]
+  0%|          | 0/684 [00:00<?, ?it/s]  0%|          | 1/684 [00:00<02:39,  4.29it/s]  0%|          | 3/684 [00:00<01:18,  8.69it/s]  1%|          | 5/684 [00:00<01:03, 10.63it/s]  1%|          | 7/684 [00:00<00:58, 11.63it/s]  1%|▏         | 9/684 [00:00<00:55, 12.22it/s]  2%|▏         | 11/684 [00:00<00:53, 12.57it/s]  2%|▏         | 13/684 [00:01<00:52, 12.89it/s]  2%|▏         | 15/684 [00:01<00:51, 13.00it/s]  2%|▏         | 17/684 [00:01<00:50, 13.13it/s]  3%|▎         | 19/684 [00:01<00:50, 13.27it/s]  3%|▎         | 21/684 [00:01<00:49, 13.29it/s]  3%|▎         | 23/684 [00:01<00:50, 13.10it/s]  4%|▎         | 25/684 [00:02<00:50, 13.16it/s]  4%|▍         | 27/684 [00:02<00:49, 13.31it/s]  4%|▍         | 29/684 [00:02<00:49, 13.28it/s]  5%|▍         | 31/684 [00:02<00:48, 13.44it/s]  5%|▍         | 33/684 [00:02<00:48, 13.38it/s]  5%|▌         | 35/684 [00:02<00:48, 13.31it/s]  5%|▌         | 37/684 [00:02<00:48, 13.31it/s]  6%|▌         | 39/684 [00:03<00:47, 13.49it/s]  6%|▌         | 41/684 [00:03<00:47, 13.47it/s]  6%|▋         | 43/684 [00:03<00:48, 13.25it/s]  7%|▋         | 45/684 [00:03<00:48, 13.17it/s]  7%|▋         | 47/684 [00:03<00:48, 13.14it/s]  7%|▋         | 49/684 [00:03<00:48, 13.07it/s]  7%|▋         | 51/684 [00:03<00:48, 13.10it/s]  8%|▊         | 53/684 [00:04<00:48, 13.02it/s]  8%|▊         | 55/684 [00:04<00:48, 12.95it/s]  8%|▊         | 57/684 [00:04<00:48, 12.97it/s]  9%|▊         | 59/684 [00:04<00:47, 13.09it/s]  9%|▉         | 61/684 [00:04<00:47, 13.07it/s]  9%|▉         | 63/684 [00:04<00:47, 13.05it/s] 10%|▉         | 65/684 [00:05<00:47, 13.07it/s] 10%|▉         | 67/684 [00:05<00:47, 13.08it/s] 10%|█         | 69/684 [00:05<00:46, 13.09it/s] 10%|█         | 71/684 [00:05<00:46, 13.16it/s] 11%|█         | 73/684 [00:05<00:46, 13.14it/s] 11%|█         | 75/684 [00:05<00:46, 13.11it/s] 11%|█▏        | 77/684 [00:05<00:46, 13.17it/s] 12%|█▏        | 79/684 [00:06<00:46, 13.13it/s] 
12%|█▏        | 81/684 [00:06<00:46, 13.11it/s] 12%|█▏        | 83/684 [00:06<00:45, 13.13it/s] 12%|█▏        | 85/684 [00:06<00:45, 13.12it/s] 13%|█▎        | 87/684 [00:06<00:45, 13.12it/s] 13%|█▎        | 89/684 [00:06<00:45, 13.09it/s] 13%|█▎        | 91/684 [00:07<00:45, 13.13it/s] 14%|█▎        | 93/684 [00:07<00:44, 13.17it/s] 14%|█▍        | 95/684 [00:07<00:44, 13.16it/s] 14%|█▍        | 97/684 [00:07<00:44, 13.12it/s] 14%|█▍        | 99/684 [00:07<00:44, 13.10it/s] 15%|█▍        | 101/684 [00:07<00:44, 13.09it/s] 15%|█▌        | 103/684 [00:07<00:44, 13.09it/s] 15%|█▌        | 105/684 [00:08<00:44, 13.08it/s] 16%|█▌        | 107/684 [00:08<00:44, 13.07it/s] 16%|█▌        | 109/684 [00:08<00:43, 13.13it/s] 16%|█▌        | 111/684 [00:08<00:43, 13.27it/s] 17%|█▋        | 113/684 [00:08<00:42, 13.49it/s] 17%|█▋        | 115/684 [00:08<00:42, 13.43it/s] 17%|█▋        | 117/684 [00:09<00:42, 13.32it/s] 17%|█▋        | 119/684 [00:09<00:42, 13.30it/s] 18%|█▊        | 121/684 [00:09<00:42, 13.18it/s] 18%|█▊        | 123/684 [00:09<00:42, 13.15it/s] 18%|█▊        | 125/684 [00:09<00:41, 13.43it/s] 19%|█▊        | 127/684 [00:09<00:41, 13.54it/s] 19%|█▉        | 129/684 [00:09<00:40, 13.57it/s] 19%|█▉        | 131/684 [00:10<00:40, 13.58it/s] 19%|█▉        | 133/684 [00:10<00:40, 13.68it/s] 20%|█▉        | 135/684 [00:10<00:40, 13.69it/s] 20%|██        | 137/684 [00:10<00:40, 13.67it/s] 20%|██        | 139/684 [00:10<00:39, 13.72it/s] 21%|██        | 141/684 [00:10<00:39, 13.73it/s] 21%|██        | 143/684 [00:10<00:39, 13.73it/s] 21%|██        | 145/684 [00:11<00:39, 13.71it/s] 21%|██▏       | 147/684 [00:11<00:39, 13.73it/s] 22%|██▏       | 149/684 [00:11<00:38, 13.72it/s] 22%|██▏       | 151/684 [00:11<00:38, 13.70it/s] 22%|██▏       | 153/684 [00:11<00:38, 13.71it/s] 23%|██▎       | 155/684 [00:11<00:38, 13.71it/s] 23%|██▎       | 157/684 [00:11<00:38, 13.71it/s] 23%|██▎       | 159/684 [00:12<00:38, 13.69it/s] 24%|██▎   
    | 161/684 [00:12<00:38, 13.67it/s] 24%|██▍       | 163/684 [00:12<00:38, 13.64it/s] 24%|██▍       | 165/684 [00:12<00:37, 13.71it/s] 24%|██▍       | 167/684 [00:12<00:37, 13.70it/s] 25%|██▍       | 169/684 [00:12<00:37, 13.70it/s] 25%|██▌       | 171/684 [00:12<00:37, 13.70it/s] 25%|██▌       | 173/684 [00:13<00:37, 13.70it/s] 26%|██▌       | 175/684 [00:13<00:37, 13.71it/s] 26%|██▌       | 177/684 [00:13<00:37, 13.69it/s] 26%|██▌       | 179/684 [00:13<00:36, 13.73it/s] 26%|██▋       | 181/684 [00:13<00:36, 13.70it/s] 27%|██▋       | 183/684 [00:13<00:36, 13.73it/s] 27%|██▋       | 185/684 [00:13<00:36, 13.74it/s] 27%|██▋       | 187/684 [00:14<00:36, 13.69it/s] 28%|██▊       | 189/684 [00:14<00:36, 13.66it/s] 28%|██▊       | 191/684 [00:14<00:36, 13.65it/s] 28%|██▊       | 193/684 [00:14<00:35, 13.68it/s] 29%|██▊       | 195/684 [00:14<00:35, 13.71it/s] 29%|██▉       | 197/684 [00:14<00:35, 13.73it/s] 29%|██▉       | 199/684 [00:15<00:35, 13.75it/s] 29%|██▉       | 201/684 [00:15<00:35, 13.75it/s] 30%|██▉       | 203/684 [00:15<00:34, 13.78it/s] 30%|██▉       | 205/684 [00:15<00:34, 13.82it/s] 30%|███       | 207/684 [00:15<00:34, 13.83it/s] 31%|███       | 209/684 [00:15<00:34, 13.78it/s] 31%|███       | 211/684 [00:15<00:34, 13.81it/s] 31%|███       | 213/684 [00:16<00:34, 13.76it/s] 31%|███▏      | 215/684 [00:16<00:34, 13.75it/s] 32%|███▏      | 217/684 [00:16<00:33, 13.76it/s] 32%|███▏      | 219/684 [00:16<00:33, 13.76it/s] 32%|███▏      | 221/684 [00:16<00:33, 13.74it/s] 33%|███▎      | 223/684 [00:16<00:33, 13.73it/s] 33%|███▎      | 225/684 [00:16<00:33, 13.70it/s] 33%|███▎      | 227/684 [00:17<00:33, 13.75it/s] 33%|███▎      | 229/684 [00:19<03:05,  2.46it/s] 34%|███▍      | 231/684 [00:19<02:17,  3.29it/s] 34%|███▍      | 233/684 [00:19<01:44,  4.31it/s] 34%|███▍      | 235/684 [00:19<01:21,  5.50it/s] 35%|███▍      | 237/684 [00:19<01:05,  6.83it/s] 35%|███▍      | 239/684 [00:20<00:56,  7.92it/s] 35%|███▌  
    | 241/684 [00:20<00:49,  8.86it/s] 36%|███▌      | 243/684 [00:20<00:44,  9.84it/s] 36%|███▌      | 245/684 [00:20<00:42, 10.34it/s] 36%|███▌      | 247/684 [00:20<00:40, 10.88it/s] 36%|███▋      | 249/684 [00:20<00:38, 11.37it/s] 37%|███▋      | 251/684 [00:21<00:36, 11.73it/s] 37%|███▋      | 253/684 [00:21<00:35, 12.23it/s] 37%|███▋      | 255/684 [00:21<00:35, 12.24it/s] 38%|███▊      | 257/684 [00:21<00:33, 12.66it/s] 38%|███▊      | 259/684 [00:21<00:33, 12.70it/s] 38%|███▊      | 261/684 [00:21<00:33, 12.81it/s] 38%|███▊      | 263/684 [00:21<00:32, 12.84it/s] 39%|███▊      | 265/684 [00:22<00:32, 12.99it/s] 39%|███▉      | 267/684 [00:22<00:31, 13.05it/s] 39%|███▉      | 269/684 [00:22<00:32, 12.72it/s] 40%|███▉      | 271/684 [00:22<00:32, 12.65it/s] 40%|███▉      | 273/684 [00:22<00:31, 12.87it/s] 40%|████      | 275/684 [00:22<00:30, 13.22it/s] 40%|████      | 277/684 [00:23<00:30, 13.46it/s] 41%|████      | 279/684 [00:23<00:30, 13.14it/s] 41%|████      | 281/684 [00:23<00:30, 13.28it/s] 41%|████▏     | 283/684 [00:23<00:30, 12.98it/s] 42%|████▏     | 285/684 [00:23<00:30, 13.14it/s] 42%|████▏     | 287/684 [00:23<00:31, 12.68it/s] 42%|████▏     | 289/684 [00:23<00:30, 13.05it/s] 43%|████▎     | 291/684 [00:24<00:30, 12.80it/s] 43%|████▎     | 293/684 [00:24<00:30, 12.89it/s] 43%|████▎     | 295/684 [00:24<00:30, 12.77it/s] 43%|████▎     | 297/684 [00:24<00:30, 12.70it/s] 44%|████▎     | 299/684 [00:24<00:29, 12.86it/s] 44%|████▍     | 301/684 [00:24<00:29, 13.09it/s] 44%|████▍     | 303/684 [00:25<00:29, 12.80it/s] 45%|████▍     | 305/684 [00:25<00:29, 12.73it/s] 45%|████▍     | 307/684 [00:25<00:29, 12.79it/s] 45%|████▌     | 309/684 [00:25<00:29, 12.71it/s] 45%|████▌     | 311/684 [00:25<00:29, 12.65it/s] 46%|████▌     | 313/684 [00:25<00:28, 12.92it/s] 46%|████▌     | 315/684 [00:26<00:29, 12.69it/s] 46%|████▋     | 317/684 [00:26<00:28, 12.92it/s] 47%|████▋     | 319/684 [00:26<00:27, 13.06it/s] 47%|████▋ 
    | 321/684 [00:26<00:27, 13.17it/s] 47%|████▋     | 323/684 [00:26<00:27, 13.31it/s] 48%|████▊     | 325/684 [00:26<00:26, 13.49it/s] 48%|████▊     | 327/684 [00:26<00:26, 13.65it/s] 48%|████▊     | 329/684 [00:27<00:25, 13.76it/s] 48%|████▊     | 331/684 [00:27<00:25, 13.84it/s] 49%|████▊     | 333/684 [00:27<00:25, 13.91it/s] 49%|████▉     | 335/684 [00:27<00:25, 13.76it/s] 49%|████▉     | 337/684 [00:27<00:25, 13.75it/s] 50%|████▉     | 339/684 [00:27<00:24, 13.81it/s] 50%|████▉     | 341/684 [00:27<00:24, 13.90it/s] 50%|█████     | 343/684 [00:28<00:24, 13.94it/s] 50%|█████     | 345/684 [00:28<00:24, 13.96it/s] 51%|█████     | 347/684 [00:28<00:24, 14.00it/s] 51%|█████     | 349/684 [00:28<00:23, 14.01it/s] 51%|█████▏    | 351/684 [00:28<00:23, 14.03it/s] 52%|█████▏    | 353/684 [00:28<00:23, 14.04it/s] 52%|█████▏    | 355/684 [00:28<00:23, 14.04it/s] 52%|█████▏    | 357/684 [00:29<00:23, 14.06it/s] 52%|█████▏    | 359/684 [00:29<00:23, 14.04it/s] 53%|█████▎    | 361/684 [00:29<00:23, 14.04it/s] 53%|█████▎    | 363/684 [00:29<00:22, 14.01it/s] 53%|█████▎    | 365/684 [00:29<00:22, 14.03it/s] 54%|█████▎    | 367/684 [00:29<00:22, 14.02it/s] 54%|█████▍    | 369/684 [00:29<00:22, 14.03it/s] 54%|█████▍    | 371/684 [00:30<00:22, 13.99it/s] 55%|█████▍    | 373/684 [00:30<00:22, 14.03it/s] 55%|█████▍    | 375/684 [00:30<00:22, 14.02it/s] 55%|█████▌    | 377/684 [00:30<00:21, 14.02it/s] 55%|█████▌    | 379/684 [00:30<00:21, 14.04it/s] 56%|█████▌    | 381/684 [00:30<00:21, 14.06it/s] 56%|█████▌    | 383/684 [00:30<00:21, 14.03it/s] 56%|█████▋    | 385/684 [00:31<00:21, 14.03it/s] 57%|█████▋    | 387/684 [00:31<00:21, 14.04it/s] 57%|█████▋    | 389/684 [00:31<00:21, 14.05it/s] 57%|█████▋    | 391/684 [00:31<00:20, 13.98it/s] 57%|█████▋    | 393/684 [00:31<00:20, 14.01it/s] 58%|█████▊    | 395/684 [00:31<00:20, 14.04it/s] 58%|█████▊    | 397/684 [00:31<00:20, 14.02it/s] 58%|█████▊    | 399/684 [00:32<00:20, 14.01it/s] 
59%|█████▊    | 401/684 [00:32<00:20, 14.02it/s] 59%|█████▉    | 403/684 [00:32<00:20, 14.01it/s] 59%|█████▉    | 405/684 [00:32<00:19, 14.03it/s] 60%|█████▉    | 407/684 [00:32<00:19, 14.03it/s] 60%|█████▉    | 409/684 [00:32<00:19, 14.04it/s] 60%|██████    | 411/684 [00:32<00:19, 14.03it/s] 60%|██████    | 413/684 [00:33<00:19, 14.03it/s] 61%|██████    | 415/684 [00:33<00:19, 14.05it/s] 61%|██████    | 417/684 [00:33<00:19, 14.03it/s] 61%|██████▏   | 419/684 [00:33<00:18, 14.00it/s] 62%|██████▏   | 421/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 423/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 425/684 [00:33<00:18, 14.01it/s] 62%|██████▏   | 427/684 [00:34<00:18, 14.00it/s] 63%|██████▎   | 429/684 [00:34<00:18, 14.00it/s] 63%|██████▎   | 431/684 [00:34<00:18, 14.02it/s] 63%|██████▎   | 433/684 [00:34<00:17, 14.01it/s] 64%|██████▎   | 435/684 [00:34<00:17, 14.02it/s] 64%|██████▍   | 437/684 [00:34<00:17, 14.02it/s] 64%|██████▍   | 439/684 [00:34<00:17, 14.01it/s] 64%|██████▍   | 441/684 [00:35<00:17, 14.01it/s] 65%|██████▍   | 443/684 [00:35<00:17, 14.00it/s] 65%|██████▌   | 445/684 [00:35<00:17, 14.00it/s] 65%|██████▌   | 447/684 [00:35<00:16, 14.00it/s] 66%|██████▌   | 449/684 [00:35<00:16, 14.02it/s] 66%|██████▌   | 451/684 [00:35<00:16, 14.02it/s] 66%|██████▌   | 453/684 [00:35<00:16, 14.01it/s] 67%|██████▋   | 455/684 [00:36<00:16, 14.01it/s] 67%|██████▋   | 457/684 [00:38<01:31,  2.48it/s] 67%|██████▋   | 459/684 [00:38<01:08,  3.29it/s] 67%|██████▋   | 461/684 [00:38<00:52,  4.27it/s] 68%|██████▊   | 463/684 [00:38<00:40,  5.40it/s] 68%|██████▊   | 465/684 [00:38<00:33,  6.56it/s] 68%|██████▊   | 467/684 [00:39<00:28,  7.70it/s] 69%|██████▊   | 469/684 [00:39<00:24,  8.88it/s] 69%|██████▉   | 471/684 [00:39<00:21,  9.68it/s] 69%|██████▉   | 473/684 [00:39<00:19, 10.73it/s] 69%|██████▉   | 475/684 [00:39<00:18, 11.01it/s] 70%|██████▉   | 477/684 [00:39<00:17, 11.71it/s] 70%|███████   | 479/684 [00:40<00:17, 11.91it/s] 
70%|███████   | 481/684 [00:40<00:16, 12.22it/s] 71%|███████   | 483/684 [00:40<00:16, 12.13it/s] 71%|███████   | 485/684 [00:40<00:15, 12.57it/s] 71%|███████   | 487/684 [00:40<00:15, 12.66it/s] 71%|███████▏  | 489/684 [00:40<00:15, 12.75it/s] 72%|███████▏  | 491/684 [00:40<00:14, 12.96it/s] 72%|███████▏  | 493/684 [00:41<00:14, 12.79it/s] 72%|███████▏  | 495/684 [00:41<00:14, 13.17it/s] 73%|███████▎  | 497/684 [00:41<00:14, 12.85it/s] 73%|███████▎  | 499/684 [00:41<00:14, 12.89it/s]                                                  73%|███████▎  | 500/684 [00:41<00:14, 12.89it/s] 73%|███████▎  | 501/684 [00:41<00:14, 12.82it/s] 74%|███████▎  | 503/684 [00:41<00:14, 12.65it/s] 74%|███████▍  | 505/684 [00:42<00:13, 12.89it/s] 74%|███████▍  | 507/684 [00:42<00:13, 13.20it/s] 74%|███████▍  | 509/684 [00:42<00:13, 12.75it/s] 75%|███████▍  | 511/684 [00:42<00:13, 13.14it/s] 75%|███████▌  | 513/684 [00:42<00:13, 12.84it/s] 75%|███████▌  | 515/684 [00:42<00:12, 13.20it/s] 76%|███████▌  | 517/684 [00:42<00:12, 13.02it/s] 76%|███████▌  | 519/684 [00:43<00:12, 13.12it/s] 76%|███████▌  | 521/684 [00:43<00:12, 13.45it/s] 76%|███████▋  | 523/684 [00:43<00:12, 12.92it/s] 77%|███████▋  | 525/684 [00:43<00:12, 13.08it/s] 77%|███████▋  | 527/684 [00:43<00:11, 13.36it/s] 77%|███████▋  | 529/684 [00:43<00:11, 12.98it/s] 78%|███████▊  | 531/684 [00:44<00:11, 13.26it/s] 78%|███████▊  | 533/684 [00:44<00:11, 12.91it/s] 78%|███████▊  | 535/684 [00:44<00:11, 13.15it/s] 79%|███████▊  | 537/684 [00:44<00:11, 12.85it/s] 79%|███████▉  | 539/684 [00:44<00:11, 12.94it/s] 79%|███████▉  | 541/684 [00:44<00:11, 12.69it/s] 79%|███████▉  | 543/684 [00:44<00:10, 13.00it/s] 80%|███████▉  | 545/684 [00:45<00:11, 12.60it/s] 80%|███████▉  | 547/684 [00:45<00:10, 12.85it/s] 80%|████████  | 549/684 [00:45<00:10, 12.81it/s] 81%|████████  | 551/684 [00:45<00:10, 12.98it/s] 81%|████████  | 553/684 [00:45<00:09, 13.26it/s] 81%|████████  | 555/684 [00:45<00:09, 13.48it/s]
 81%|████████▏ | 557/684 [00:46<00:09, 13.43it/s] 82%|████████▏ | 559/684 [00:46<00:09, 13.52it/s] 82%|████████▏ | 561/684 [00:46<00:09, 13.40it/s] 82%|████████▏ | 563/684 [00:46<00:08, 13.52it/s] 83%|████████▎ | 565/684 [00:46<00:08, 13.71it/s] 83%|████████▎ | 567/684 [00:46<00:08, 13.85it/s] 83%|████████▎ | 569/684 [00:46<00:08, 13.90it/s] 83%|████████▎ | 571/684 [00:47<00:08, 13.93it/s] 84%|████████▍ | 573/684 [00:47<00:07, 13.98it/s] 84%|████████▍ | 575/684 [00:47<00:07, 13.99it/s] 84%|████████▍ | 577/684 [00:47<00:07, 13.98it/s] 85%|████████▍ | 579/684 [00:47<00:07, 14.00it/s] 85%|████████▍ | 581/684 [00:47<00:07, 14.01it/s] 85%|████████▌ | 583/684 [00:47<00:07, 14.02it/s] 86%|████████▌ | 585/684 [00:48<00:07, 14.02it/s] 86%|████████▌ | 587/684 [00:48<00:06, 14.02it/s] 86%|████████▌ | 589/684 [00:48<00:06, 14.01it/s] 86%|████████▋ | 591/684 [00:48<00:06, 14.03it/s] 87%|████████▋ | 593/684 [00:48<00:06, 14.01it/s] 87%|████████▋ | 595/684 [00:48<00:06, 14.02it/s] 87%|████████▋ | 597/684 [00:48<00:06, 14.01it/s] 88%|████████▊ | 599/684 [00:49<00:06, 13.98it/s] 88%|████████▊ | 601/684 [00:49<00:05, 14.01it/s] 88%|████████▊ | 603/684 [00:49<00:05, 14.01it/s] 88%|████████▊ | 605/684 [00:49<00:05, 14.00it/s] 89%|████████▊ | 607/684 [00:49<00:05, 14.03it/s] 89%|████████▉ | 609/684 [00:49<00:05, 14.02it/s] 89%|████████▉ | 611/684 [00:49<00:05, 14.02it/s] 90%|████████▉ | 613/684 [00:50<00:05, 14.03it/s] 90%|████████▉ | 615/684 [00:50<00:04, 14.02it/s] 90%|█████████ | 617/684 [00:50<00:04, 14.01it/s] 90%|█████████ | 619/684 [00:50<00:04, 14.02it/s] 91%|█████████ | 621/684 [00:50<00:04, 14.04it/s] 91%|█████████ | 623/684 [00:50<00:04, 14.06it/s] 91%|█████████▏| 625/684 [00:50<00:04, 14.04it/s] 92%|█████████▏| 627/684 [00:51<00:04, 14.03it/s] 92%|█████████▏| 629/684 [00:51<00:03, 14.02it/s] 92%|█████████▏| 631/684 [00:51<00:03, 14.03it/s] 93%|█████████▎| 633/684 [00:51<00:03, 14.03it/s] 93%|█████████▎| 635/684 [00:51<00:03, 14.03it/s]
 93%|█████████▎| 637/684 [00:51<00:03, 14.02it/s] 93%|█████████▎| 639/684 [00:51<00:03, 14.03it/s] 94%|█████████▎| 641/684 [00:52<00:03, 14.02it/s] 94%|█████████▍| 643/684 [00:52<00:02, 14.02it/s] 94%|█████████▍| 645/684 [00:52<00:02, 13.99it/s] 95%|█████████▍| 647/684 [00:52<00:02, 14.00it/s] 95%|█████████▍| 649/684 [00:52<00:02, 14.02it/s] 95%|█████████▌| 651/684 [00:52<00:02, 14.04it/s] 95%|█████████▌| 653/684 [00:52<00:02, 14.05it/s] 96%|█████████▌| 655/684 [00:53<00:02, 14.05it/s] 96%|█████████▌| 657/684 [00:53<00:01, 14.05it/s] 96%|█████████▋| 659/684 [00:53<00:01, 14.03it/s] 97%|█████████▋| 661/684 [00:53<00:01, 14.01it/s] 97%|█████████▋| 663/684 [00:53<00:01, 14.03it/s] 97%|█████████▋| 665/684 [00:53<00:01, 14.03it/s] 98%|█████████▊| 667/684 [00:53<00:01, 14.04it/s] 98%|█████████▊| 669/684 [00:54<00:01, 14.05it/s] 98%|█████████▊| 671/684 [00:54<00:00, 14.04it/s] 98%|█████████▊| 673/684 [00:54<00:00, 14.03it/s] 99%|█████████▊| 675/684 [00:54<00:00, 14.00it/s] 99%|█████████▉| 677/684 [00:54<00:00, 14.00it/s] 99%|█████████▉| 679/684 [00:54<00:00, 14.00it/s]100%|█████████▉| 681/684 [00:54<00:00, 14.00it/s]100%|█████████▉| 683/684 [00:55<00:00, 13.99it/s]                                                 100%|██████████| 684/684 [00:57<00:00, 13.99it/s]100%|██████████| 684/684 [00:57<00:00, 11.94it/s]
+  0%|          | 0/16 [00:00<?, ?it/s] 12%|█▎        | 2/16 [00:04<00:31,  2.25s/it] 19%|█▉        | 3/16 [00:08<00:41,  3.19s/it] 25%|██▌       | 4/16 [00:13<00:44,  3.68s/it] 31%|███▏      | 5/16 [00:18<00:43,  3.96s/it] 38%|███▊      | 6/16 [00:22<00:41,  4.14s/it] 44%|████▍     | 7/16 [00:27<00:38,  4.26s/it] 50%|█████     | 8/16 [00:31<00:34,  4.34s/it] 56%|█████▋    | 9/16 [00:36<00:30,  4.39s/it] 62%|██████▎   | 10/16 [00:40<00:26,  4.43s/it] 69%|██████▉   | 11/16 [00:45<00:22,  4.45s/it] 75%|███████▌  | 12/16 [00:49<00:17,  4.47s/it] 81%|████████▏ | 13/16 [00:54<00:13,  4.48s/it] 88%|████████▊ | 14/16 [00:58<00:08,  4.48s/it] 94%|█████████▍| 15/16 [01:03<00:04,  4.48s/it]100%|██████████| 16/16 [01:06<00:00,  4.09s/it]100%|██████████| 16/16 [01:06<00:00,  4.18s/it]
+/mnt/storage/aatherton/anaconda3/envs/nmt/lib/python3.11/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning
+  warnings.warn(
+/mnt/storage/aatherton/hf_eng_fra_trans is already a clone of https://huggingface.co/aatherton2024/hf_eng_fra_trans. Make sure you pull the latest changes with `repo.git_pull()`.
+Downloading (…)lve/main/config.json:   0%|          | 0.00/1.43k [00:00<?, ?B/s]Downloading (…)lve/main/config.json: 100%|██████████| 1.43k/1.43k [00:00<00:00, 3.81MB/s]
+Downloading pytorch_model.bin:   0%|          | 0.00/299M [00:00<?, ?B/s]Downloading pytorch_model.bin:   4%|▎         | 10.5M/299M [00:00<00:05, 50.0MB/s]Downloading pytorch_model.bin:   7%|▋         | 21.0M/299M [00:00<00:03, 72.0MB/s]Downloading pytorch_model.bin:  14%|█▍        | 41.9M/299M [00:00<00:02, 95.3MB/s]Downloading pytorch_model.bin:  21%|██        | 62.9M/299M [00:00<00:02, 101MB/s] Downloading pytorch_model.bin:  28%|██▊       | 83.9M/299M [00:00<00:02, 107MB/s]Downloading pytorch_model.bin:  35%|███▌      | 105M/299M [00:02<00:05, 37.0MB/s]Downloading pytorch_model.bin:  39%|███▊      | 115M/299M [00:02<00:04, 38.6MB/s]Downloading pytorch_model.bin:  42%|████▏     | 126M/299M [00:02<00:03, 44.9MB/s]Downloading pytorch_model.bin:  46%|████▌     | 136M/299M [00:02<00:03, 52.2MB/s]Downloading pytorch_model.bin:  53%|█████▎    | 157M/299M [00:02<00:02, 59.1MB/s]Downloading pytorch_model.bin:  60%|█████▉    | 178M/299M [00:02<00:01, 71.8MB/s]Downloading pytorch_model.bin:  67%|██████▋   | 199M/299M [00:03<00:01, 81.9MB/s]Downloading pytorch_model.bin:  74%|███████▎  | 220M/299M [00:03<00:00, 89.4MB/s]Downloading pytorch_model.bin:  81%|████████  | 241M/299M [00:03<00:00, 97.5MB/s]Downloading pytorch_model.bin:  88%|████████▊ | 262M/299M [00:03<00:00, 101MB/s] Downloading pytorch_model.bin:  95%|█████████▍| 283M/299M [00:04<00:00, 83.2MB/s]Downloading pytorch_model.bin:  98%|█████████▊| 294M/299M [00:04<00:00, 78.7MB/s]Downloading pytorch_model.bin: 100%|██████████| 299M/299M [00:04<00:00, 69.6MB/s]
+Downloading (…)neration_config.json:   0%|          | 0.00/288 [00:00<?, ?B/s]Downloading (…)neration_config.json: 100%|██████████| 288/288 [00:00<00:00, 845kB/s]
+Downloading (…)okenizer_config.json:   0%|          | 0.00/234 [00:00<?, ?B/s]Downloading (…)okenizer_config.json: 100%|██████████| 234/234 [00:00<00:00, 644kB/s]
+Downloading (…)olve/main/vocab.json:   0%|          | 0.00/2.14k [00:00<?, ?B/s]Downloading (…)olve/main/vocab.json: 100%|██████████| 2.14k/2.14k [00:00<00:00, 5.80MB/s]
+Downloading (…)olve/main/merges.txt:   0%|          | 0.00/60.0 [00:00<?, ?B/s]Downloading (…)olve/main/merges.txt: 100%|██████████| 60.0/60.0 [00:00<00:00, 196kB/s]
+Downloading (…)/main/tokenizer.json:   0%|          | 0.00/5.31k [00:00<?, ?B/s]Downloading (…)/main/tokenizer.json: 100%|██████████| 5.31k/5.31k [00:00<00:00, 12.2MB/s]
+Downloading (…)in/added_tokens.json:   0%|          | 0.00/19.0 [00:00<?, ?B/s]Downloading (…)in/added_tokens.json: 100%|██████████| 19.0/19.0 [00:00<00:00, 63.2kB/s]
+Downloading (…)cial_tokens_map.json:   0%|          | 0.00/123 [00:00<?, ?B/s]Downloading (…)cial_tokens_map.json: 100%|██████████| 123/123 [00:00<00:00, 365kB/s]
diff --git a/myoutput_1551.out b/myoutput_1551.out
deleted file mode 100644
index 922e54b747c5a72439d13ea889cb145b1f78b10a..0000000000000000000000000000000000000000
--- a/myoutput_1551.out
+++ /dev/null
@@ -1 +0,0 @@
-evaluate1
diff --git a/myoutput_1552.out b/myoutput_1552.out
deleted file mode 100644
index 922e54b747c5a72439d13ea889cb145b1f78b10a..0000000000000000000000000000000000000000
--- a/myoutput_1552.out
+++ /dev/null
@@ -1 +0,0 @@
-evaluate1
diff --git a/myoutput_1553.out b/myoutput_1553.out
deleted file mode 100644
index 922e54b747c5a72439d13ea889cb145b1f78b10a..0000000000000000000000000000000000000000
--- a/myoutput_1553.out
+++ /dev/null
@@ -1 +0,0 @@
-evaluate1
diff --git a/myoutput_1554.out b/myoutput_1554.out
deleted file mode 100644
index 922e54b747c5a72439d13ea889cb145b1f78b10a..0000000000000000000000000000000000000000
--- a/myoutput_1554.out
+++ /dev/null
@@ -1 +0,0 @@
-evaluate1
diff --git a/myoutput_1555.out b/myoutput_1555.out
deleted file mode 100644
index 1c5fb65ab4a88e7713dc7837f56a50a607d60f5b..0000000000000000000000000000000000000000
--- a/myoutput_1555.out
+++ /dev/null
@@ -1,5 +0,0 @@
-evaluate1
-trainer train 1
-{'loss': 1.2688, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
-{'train_runtime': 56.3764, 'train_samples_per_second': 388.035, 'train_steps_per_second': 12.133, 'train_loss': 1.1421493842587833, 'epoch': 3.0}
-evaluate 2
diff --git a/myoutput_1556.out b/myoutput_1556.out
deleted file mode 100644
index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..0000000000000000000000000000000000000000
diff --git a/myoutput_1557.out b/myoutput_1557.out
deleted file mode 100644
index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..0000000000000000000000000000000000000000
diff --git a/myoutput_1558.out b/myoutput_1558.out
deleted file mode 100644
index 09b5878576aa3e9dc06ed77a3407d1c5583f61cb..0000000000000000000000000000000000000000
--- a/myoutput_1558.out
+++ /dev/null
@@ -1,4 +0,0 @@
-
-
-
-evaluate1
diff --git a/myoutput_1559.out b/myoutput_1559.out
deleted file mode 100644
index 09b5878576aa3e9dc06ed77a3407d1c5583f61cb..0000000000000000000000000000000000000000
--- a/myoutput_1559.out
+++ /dev/null
@@ -1,4 +0,0 @@
-
-
-
-evaluate1
diff --git a/myoutput_1560.out b/myoutput_1560.out
deleted file mode 100644
index 09b5878576aa3e9dc06ed77a3407d1c5583f61cb..0000000000000000000000000000000000000000
--- a/myoutput_1560.out
+++ /dev/null
@@ -1,4 +0,0 @@
-
-
-
-evaluate1
diff --git a/myoutput_1561.out b/myoutput_1561.out
deleted file mode 100644
index eb09f6afa873df848fd0a0eb3e278a9742a17b7b..0000000000000000000000000000000000000000
--- a/myoutput_1561.out
+++ /dev/null
@@ -1,8 +0,0 @@
-
-
-
-evaluate1
-trainer train 1
-{'loss': 0.6532, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
-{'train_runtime': 57.6599, 'train_samples_per_second': 379.397, 'train_steps_per_second': 11.863, 'train_loss': 0.6262621963233278, 'epoch': 3.0}
-evaluate 2
diff --git a/myoutput_1562.out b/myoutput_1562.out
deleted file mode 100644
index 8dd22693691e971b800f0052a384de97ce0c151a..0000000000000000000000000000000000000000
--- a/myoutput_1562.out
+++ /dev/null
@@ -1,10 +0,0 @@
-
-
-
-evaluate1
-{'eval_loss': 0.5364619493484497, 'eval_bleu': 0.0, 'eval_runtime': 69.2839, 'eval_samples_per_second': 14.448, 'eval_steps_per_second': 0.231}
-trainer train 1
-{'loss': 0.4504, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
-{'train_runtime': 58.3552, 'train_samples_per_second': 374.877, 'train_steps_per_second': 11.721, 'train_loss': 0.4447354879992747, 'epoch': 3.0}
-evaluate 2
-{'eval_loss': 0.411633163690567, 'eval_bleu': 0.0, 'eval_runtime': 68.1275, 'eval_samples_per_second': 14.693, 'eval_steps_per_second': 0.235, 'epoch': 3.0}
diff --git a/myoutput_1563.out b/myoutput_1563.out
deleted file mode 100644
index fafc38ce91e55d184d923be5c49e4da957bb2e30..0000000000000000000000000000000000000000
--- a/myoutput_1563.out
+++ /dev/null
@@ -1,61 +0,0 @@
-
-
-
-MarianMTModel(
-  (model): MarianModel(
-    (shared): Embedding(59514, 512, padding_idx=59513)
-    (encoder): MarianEncoder(
-      (embed_tokens): Embedding(59514, 512, padding_idx=59513)
-      (embed_positions): MarianSinusoidalPositionalEmbedding(512, 512)
-      (layers): ModuleList(
-        (0-5): 6 x MarianEncoderLayer(
-          (self_attn): MarianAttention(
-            (k_proj): Linear(in_features=512, out_features=512, bias=True)
-            (v_proj): Linear(in_features=512, out_features=512, bias=True)
-            (q_proj): Linear(in_features=512, out_features=512, bias=True)
-            (out_proj): Linear(in_features=512, out_features=512, bias=True)
-          )
-          (self_attn_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-          (activation_fn): SiLUActivation()
-          (fc1): Linear(in_features=512, out_features=2048, bias=True)
-          (fc2): Linear(in_features=2048, out_features=512, bias=True)
-          (final_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-        )
-      )
-    )
-    (decoder): MarianDecoder(
-      (embed_tokens): Embedding(59514, 512, padding_idx=59513)
-      (embed_positions): MarianSinusoidalPositionalEmbedding(512, 512)
-      (layers): ModuleList(
-        (0-5): 6 x MarianDecoderLayer(
-          (self_attn): MarianAttention(
-            (k_proj): Linear(in_features=512, out_features=512, bias=True)
-            (v_proj): Linear(in_features=512, out_features=512, bias=True)
-            (q_proj): Linear(in_features=512, out_features=512, bias=True)
-            (out_proj): Linear(in_features=512, out_features=512, bias=True)
-          )
-          (activation_fn): SiLUActivation()
-          (self_attn_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-          (encoder_attn): MarianAttention(
-            (k_proj): Linear(in_features=512, out_features=512, bias=True)
-            (v_proj): Linear(in_features=512, out_features=512, bias=True)
-            (q_proj): Linear(in_features=512, out_features=512, bias=True)
-            (out_proj): Linear(in_features=512, out_features=512, bias=True)
-          )
-          (encoder_attn_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-          (fc1): Linear(in_features=512, out_features=2048, bias=True)
-          (fc2): Linear(in_features=2048, out_features=512, bias=True)
-          (final_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-        )
-      )
-    )
-  )
-  (lm_head): Linear(in_features=512, out_features=59514, bias=False)
-)
-evaluate1
-{'eval_loss': 0.411633163690567, 'eval_bleu': 0.0, 'eval_runtime': 69.9028, 'eval_samples_per_second': 14.32, 'eval_steps_per_second': 0.229}
-trainer train 1
-{'loss': 0.3189, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
-{'train_runtime': 57.9326, 'train_samples_per_second': 377.611, 'train_steps_per_second': 11.807, 'train_loss': 0.3294184054547583, 'epoch': 3.0}
-evaluate 2
-{'eval_loss': 0.33941635489463806, 'eval_bleu': 0.0, 'eval_runtime': 69.4586, 'eval_samples_per_second': 14.411, 'eval_steps_per_second': 0.23, 'epoch': 3.0}
diff --git a/myoutput_1564.out b/myoutput_1564.out
deleted file mode 100644
index 62009c9f2feaa32f1c525995ae26f07e824fdd6a..0000000000000000000000000000000000000000
--- a/myoutput_1564.out
+++ /dev/null
@@ -1,61 +0,0 @@
-
-
-
-MarianMTModel(
-  (model): MarianModel(
-    (shared): Embedding(59514, 512, padding_idx=59513)
-    (encoder): MarianEncoder(
-      (embed_tokens): Embedding(59514, 512, padding_idx=59513)
-      (embed_positions): MarianSinusoidalPositionalEmbedding(512, 512)
-      (layers): ModuleList(
-        (0-5): 6 x MarianEncoderLayer(
-          (self_attn): MarianAttention(
-            (k_proj): Linear(in_features=512, out_features=512, bias=True)
-            (v_proj): Linear(in_features=512, out_features=512, bias=True)
-            (q_proj): Linear(in_features=512, out_features=512, bias=True)
-            (out_proj): Linear(in_features=512, out_features=512, bias=True)
-          )
-          (self_attn_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-          (activation_fn): SiLUActivation()
-          (fc1): Linear(in_features=512, out_features=2048, bias=True)
-          (fc2): Linear(in_features=2048, out_features=512, bias=True)
-          (final_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-        )
-      )
-    )
-    (decoder): MarianDecoder(
-      (embed_tokens): Embedding(59514, 512, padding_idx=59513)
-      (embed_positions): MarianSinusoidalPositionalEmbedding(512, 512)
-      (layers): ModuleList(
-        (0-5): 6 x MarianDecoderLayer(
-          (self_attn): MarianAttention(
-            (k_proj): Linear(in_features=512, out_features=512, bias=True)
-            (v_proj): Linear(in_features=512, out_features=512, bias=True)
-            (q_proj): Linear(in_features=512, out_features=512, bias=True)
-            (out_proj): Linear(in_features=512, out_features=512, bias=True)
-          )
-          (activation_fn): SiLUActivation()
-          (self_attn_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-          (encoder_attn): MarianAttention(
-            (k_proj): Linear(in_features=512, out_features=512, bias=True)
-            (v_proj): Linear(in_features=512, out_features=512, bias=True)
-            (q_proj): Linear(in_features=512, out_features=512, bias=True)
-            (out_proj): Linear(in_features=512, out_features=512, bias=True)
-          )
-          (encoder_attn_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-          (fc1): Linear(in_features=512, out_features=2048, bias=True)
-          (fc2): Linear(in_features=2048, out_features=512, bias=True)
-          (final_layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
-        )
-      )
-    )
-  )
-  (lm_head): Linear(in_features=512, out_features=59514, bias=False)
-)
-evaluate1
-{'eval_loss': 0.3534283936023712, 'eval_bleu': 0.0, 'eval_runtime': 69.9139, 'eval_samples_per_second': 14.318, 'eval_steps_per_second': 0.229}
-trainer train 1
-{'loss': 0.2276, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
-{'train_runtime': 56.8014, 'train_samples_per_second': 385.131, 'train_steps_per_second': 12.042, 'train_loss': 0.2556379162080107, 'epoch': 3.0}
-evaluate 2
-{'eval_loss': 0.30410629510879517, 'eval_bleu': 0.0, 'eval_runtime': 69.9679, 'eval_samples_per_second': 14.307, 'eval_steps_per_second': 0.229, 'epoch': 3.0}
diff --git a/myoutput_1600.out b/myoutput_1600.out
new file mode 100644
index 0000000000000000000000000000000000000000..6d59ba5d6f6fb1c8904c0e39801f7b51fb14ec9d
--- /dev/null
+++ b/myoutput_1600.out
@@ -0,0 +1,8 @@
+evaluate1
+{'eval_loss': 0.3294467329978943, 'eval_bleu': 0.021732338702567133, 'eval_chrf': 24.996195060769814, 'eval_runtime': 70.6427, 'eval_samples_per_second': 14.17, 'eval_steps_per_second': 0.226}
+trainer train 1
+{'loss': 0.2145, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
+{'train_runtime': 56.8334, 'train_samples_per_second': 384.914, 'train_steps_per_second': 12.035, 'train_loss': 0.2377676657068799, 'epoch': 3.0}
+evaluate 2
+{'eval_loss': 0.2867695093154907, 'eval_bleu': 0.02226070832187467, 'eval_chrf': 25.804707746098266, 'eval_runtime': 69.9013, 'eval_samples_per_second': 14.32, 'eval_steps_per_second': 0.229, 'epoch': 3.0}
+training model now
diff --git a/myoutput_1601.out b/myoutput_1601.out
new file mode 100644
index 0000000000000000000000000000000000000000..80b2aa5d20711d87fa0406dc331fa713629fb430
--- /dev/null
+++ b/myoutput_1601.out
@@ -0,0 +1,9 @@
+evaluate1
+{'eval_loss': 0.2867695093154907, 'eval_bleu': 0.02226070832187467, 'eval_chrf': 25.804707746098266, 'eval_runtime': 73.0567, 'eval_samples_per_second': 13.702, 'eval_steps_per_second': 0.219}
+trainer train 1
+{'loss': 0.1428, 'learning_rate': 5.380116959064328e-06, 'epoch': 2.19}
+{'train_runtime': 57.3032, 'train_samples_per_second': 381.759, 'train_steps_per_second': 11.936, 'train_loss': 0.17679918300338657, 'epoch': 3.0}
+evaluate 2
+{'eval_loss': 0.26398155093193054, 'eval_bleu': 0.02310668515912661, 'eval_chrf': 26.48909190811468, 'eval_runtime': 71.4593, 'eval_samples_per_second': 14.008, 'eval_steps_per_second': 0.224, 'epoch': 3.0}
+training model now
+[{'translation_text': 'axinquigudiflogaqueh.aqueh.aqueh.aqueh.aqueh.aqueh.aqueh.aqueh.aqueh.aquaqueh.aqueh.aqueh.aqueh.ah.ah.ah.ah.ac.ah.ac.aquac.aquac.aquaquaquaquaqabah.aqabac.aquaquaquaqababac.ac.ac.ac.ac.ac.aquac.ac.aquac.ac.aquac.caquac.ac.aqac.aqacbaqacbac.aqacaquaqaqubach.aqaqach.aqaqaquhaqaqachbquhbquququququququmabquhaquhaquququququququququququququququmababababababququququququququmabababachbachbachbacqubachchbachbobobachchchchchchchchchchchchchchchchchchchchchchchchbohbohbohdugogogogohgogogogogogogogogogogogogogogogogo'}]
diff --git a/output/added_tokens.json b/output/added_tokens.json
new file mode 100644
index 0000000000000000000000000000000000000000..20fcd9a180a63961398838e6227d85f489eb5b9e
--- /dev/null
+++ b/output/added_tokens.json
@@ -0,0 +1,3 @@
+{
+  "[PAD]": 259
+}
diff --git a/output/config.json b/output/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..ac2930e1df149545af0a5b47c7101e4b6ce592c9
--- /dev/null
+++ b/output/config.json
@@ -0,0 +1,62 @@
+{
+  "_name_or_path": "eng-nah-svo-translation",
+  "_num_labels": 3,
+  "activation_dropout": 0.0,
+  "activation_function": "swish",
+  "add_bias_logits": false,
+  "add_final_layer_norm": false,
+  "architectures": [
+    "MarianMTModel"
+  ],
+  "attention_dropout": 0.0,
+  "bad_words_ids": [
+    [
+      59513
+    ]
+  ],
+  "bos_token_id": 0,
+  "classif_dropout": 0.0,
+  "classifier_dropout": 0.0,
+  "d_model": 512,
+  "decoder_attention_heads": 8,
+  "decoder_ffn_dim": 2048,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 59513,
+  "decoder_vocab_size": 59514,
+  "dropout": 0.1,
+  "encoder_attention_heads": 8,
+  "encoder_ffn_dim": 2048,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 6,
+  "eos_token_id": 0,
+  "forced_eos_token_id": 0,
+  "gradient_checkpointing": false,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "max_length": 512,
+  "max_position_embeddings": 512,
+  "model_type": "marian",
+  "normalize_before": false,
+  "normalize_embedding": false,
+  "num_beams": 4,
+  "num_hidden_layers": 6,
+  "pad_token_id": 59513,
+  "scale_embedding": true,
+  "share_encoder_decoder_embeddings": true,
+  "static_position_embeddings": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.32.1",
+  "use_cache": true,
+  "vocab_size": 59514
+}
diff --git a/output/generation_config.json b/output/generation_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..28de9cc7167cb6cabfab1a0afbf0fabb0717e902
--- /dev/null
+++ b/output/generation_config.json
@@ -0,0 +1,16 @@
+{
+  "bad_words_ids": [
+    [
+      59513
+    ]
+  ],
+  "bos_token_id": 0,
+  "decoder_start_token_id": 59513,
+  "eos_token_id": 0,
+  "forced_eos_token_id": 0,
+  "max_length": 512,
+  "num_beams": 4,
+  "pad_token_id": 59513,
+  "renormalize_logits": true,
+  "transformers_version": "4.32.1"
+}
diff --git a/output/merges.txt b/output/merges.txt
new file mode 100644
index 0000000000000000000000000000000000000000..fcecdc26f2eae6c453a0256e84a1245332d1307c
--- /dev/null
+++ b/output/merges.txt
@@ -0,0 +1,3 @@
+#version: 0.2 - Trained by `huggingface/tokenizers`
+e n
+f r
diff --git a/output/pytorch_model.bin b/output/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..121cd97b7b2dc4ed4df3b6df4d3b8b1996904569
--- /dev/null
+++ b/output/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1696c8d38b79267d54032a50e101760f75a03238ca3b0ac8dea1ce82d3109b0d
+size 298763205
diff --git a/output/special_tokens_map.json b/output/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..342a2f53d97d4a8fe1422d2567e97ba8c525d05d
--- /dev/null
+++ b/output/special_tokens_map.json
@@ -0,0 +1,6 @@
+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "pad_token": "[PAD]",
+  "unk_token": "<|endoftext|>"
+}
diff --git a/output/tokenizer.json b/output/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..3e5da92f3a16a9f960b6c8e3e0f9508c7e607ca5
--- /dev/null
+++ b/output/tokenizer.json
@@ -0,0 +1,317 @@
+{
+  "version": "1.0",
+  "truncation": null,
+  "padding": null,
+  "added_tokens": [
+    {
+      "id": 0,
+      "content": "<|endoftext|>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 259,
+      "content": "[PAD]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    }
+  ],
+  "normalizer": null,
+  "pre_tokenizer": {
+    "type": "ByteLevel",
+    "add_prefix_space": false,
+    "trim_offsets": true,
+    "use_regex": true
+  },
+  "post_processor": {
+    "type": "ByteLevel",
+    "add_prefix_space": true,
+    "trim_offsets": false,
+    "use_regex": true
+  },
+  "decoder": {
+    "type": "ByteLevel",
+    "add_prefix_space": true,
+    "trim_offsets": true,
+    "use_regex": true
+  },
+  "model": {
+    "type": "BPE",
+    "dropout": null,
+    "unk_token": null,
+    "continuing_subword_prefix": "",
+    "end_of_word_suffix": "",
+    "fuse_unk": false,
+    "vocab": {
+      "<|endoftext|>": 0,
+      "!": 1,
+      "\"": 2,
+      "#": 3,
+      "$": 4,
+      "%": 5,
+      "&": 6,
+      "'": 7,
+      "(": 8,
+      ")": 9,
+      "*": 10,
+      "+": 11,
+      ",": 12,
+      "-": 13,
+      ".": 14,
+      "/": 15,
+      "0": 16,
+      "1": 17,
+      "2": 18,
+      "3": 19,
+      "4": 20,
+      "5": 21,
+      "6": 22,
+      "7": 23,
+      "8": 24,
+      "9": 25,
+      ":": 26,
+      ";": 27,
+      "<": 28,
+      "=": 29,
+      ">": 30,
+      "?": 31,
+      "@": 32,
+      "A": 33,
+      "B": 34,
+      "C": 35,
+      "D": 36,
+      "E": 37,
+      "F": 38,
+      "G": 39,
+      "H": 40,
+      "I": 41,
+      "J": 42,
+      "K": 43,
+      "L": 44,
+      "M": 45,
+      "N": 46,
+      "O": 47,
+      "P": 48,
+      "Q": 49,
+      "R": 50,
+      "S": 51,
+      "T": 52,
+      "U": 53,
+      "V": 54,
+      "W": 55,
+      "X": 56,
+      "Y": 57,
+      "Z": 58,
+      "[": 59,
+      "\\": 60,
+      "]": 61,
+      "^": 62,
+      "_": 63,
+      "`": 64,
+      "a": 65,
+      "b": 66,
+      "c": 67,
+      "d": 68,
+      "e": 69,
+      "f": 70,
+      "g": 71,
+      "h": 72,
+      "i": 73,
+      "j": 74,
+      "k": 75,
+      "l": 76,
+      "m": 77,
+      "n": 78,
+      "o": 79,
+      "p": 80,
+      "q": 81,
+      "r": 82,
+      "s": 83,
+      "t": 84,
+      "u": 85,
+      "v": 86,
+      "w": 87,
+      "x": 88,
+      "y": 89,
+      "z": 90,
+      "{": 91,
+      "|": 92,
+      "}": 93,
+      "~": 94,
+      "¡": 95,
+      "¢": 96,
+      "£": 97,
+      "¤": 98,
+      "¥": 99,
+      "¦": 100,
+      "§": 101,
+      "¨": 102,
+      "©": 103,
+      "ª": 104,
+      "«": 105,
+      "¬": 106,
+      "®": 107,
+      "¯": 108,
+      "°": 109,
+      "±": 110,
+      "²": 111,
+      "³": 112,
+      "´": 113,
+      "µ": 114,
+      "¶": 115,
+      "·": 116,
+      "¸": 117,
+      "¹": 118,
+      "º": 119,
+      "»": 120,
+      "¼": 121,
+      "½": 122,
+      "¾": 123,
+      "¿": 124,
+      "À": 125,
+      "Á": 126,
+      "Â": 127,
+      "Ã": 128,
+      "Ä": 129,
+      "Å": 130,
+      "Æ": 131,
+      "Ç": 132,
+      "È": 133,
+      "É": 134,
+      "Ê": 135,
+      "Ë": 136,
+      "Ì": 137,
+      "Í": 138,
+      "Î": 139,
+      "Ï": 140,
+      "Ð": 141,
+      "Ñ": 142,
+      "Ò": 143,
+      "Ó": 144,
+      "Ô": 145,
+      "Õ": 146,
+      "Ö": 147,
+      "×": 148,
+      "Ø": 149,
+      "Ù": 150,
+      "Ú": 151,
+      "Û": 152,
+      "Ü": 153,
+      "Ý": 154,
+      "Þ": 155,
+      "ß": 156,
+      "à": 157,
+      "á": 158,
+      "â": 159,
+      "ã": 160,
+      "ä": 161,
+      "å": 162,
+      "æ": 163,
+      "ç": 164,
+      "è": 165,
+      "é": 166,
+      "ê": 167,
+      "ë": 168,
+      "ì": 169,
+      "í": 170,
+      "î": 171,
+      "ï": 172,
+      "ð": 173,
+      "ñ": 174,
+      "ò": 175,
+      "ó": 176,
+      "ô": 177,
+      "õ": 178,
+      "ö": 179,
+      "÷": 180,
+      "ø": 181,
+      "ù": 182,
+      "ú": 183,
+      "û": 184,
+      "ü": 185,
+      "ý": 186,
+      "þ": 187,
+      "ÿ": 188,
+      "Ā": 189,
+      "ā": 190,
+      "Ă": 191,
+      "ă": 192,
+      "Ą": 193,
+      "ą": 194,
+      "Ć": 195,
+      "ć": 196,
+      "Ĉ": 197,
+      "ĉ": 198,
+      "Ċ": 199,
+      "ċ": 200,
+      "Č": 201,
+      "č": 202,
+      "Ď": 203,
+      "ď": 204,
+      "Đ": 205,
+      "đ": 206,
+      "Ē": 207,
+      "ē": 208,
+      "Ĕ": 209,
+      "ĕ": 210,
+      "Ė": 211,
+      "ė": 212,
+      "Ę": 213,
+      "ę": 214,
+      "Ě": 215,
+      "ě": 216,
+      "Ĝ": 217,
+      "ĝ": 218,
+      "Ğ": 219,
+      "ğ": 220,
+      "Ġ": 221,
+      "ġ": 222,
+      "Ģ": 223,
+      "ģ": 224,
+      "Ĥ": 225,
+      "ĥ": 226,
+      "Ħ": 227,
+      "ħ": 228,
+      "Ĩ": 229,
+      "ĩ": 230,
+      "Ī": 231,
+      "ī": 232,
+      "Ĭ": 233,
+      "ĭ": 234,
+      "Į": 235,
+      "į": 236,
+      "İ": 237,
+      "ı": 238,
+      "Ĳ": 239,
+      "ĳ": 240,
+      "Ĵ": 241,
+      "ĵ": 242,
+      "Ķ": 243,
+      "ķ": 244,
+      "ĸ": 245,
+      "Ĺ": 246,
+      "ĺ": 247,
+      "Ļ": 248,
+      "ļ": 249,
+      "Ľ": 250,
+      "ľ": 251,
+      "Ŀ": 252,
+      "ŀ": 253,
+      "Ł": 254,
+      "ł": 255,
+      "Ń": 256,
+      "en": 257,
+      "fr": 258
+    },
+    "merges": [
+      "e n",
+      "f r"
+    ]
+  }
+}
\ No newline at end of file
diff --git a/output/tokenizer_config.json b/output/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..546efe6d18ae2ad7758d0c9ef51cacdb81c8dc9d
--- /dev/null
+++ b/output/tokenizer_config.json
@@ -0,0 +1,9 @@
+{
+  "add_prefix_space": false,
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|endoftext|>",
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}
diff --git a/output/vocab.json b/output/vocab.json
new file mode 100644
index 0000000000000000000000000000000000000000..9cd5bf34d923be02a0eae563f9c595833f08bef3
--- /dev/null
+++ b/output/vocab.json
@@ -0,0 +1 @@
+{"<|endoftext|>":0,"!":1,"\"":2,"#":3,"$":4,"%":5,"&":6,"'":7,"(":8,")":9,"*":10,"+":11,",":12,"-":13,".":14,"/":15,"0":16,"1":17,"2":18,"3":19,"4":20,"5":21,"6":22,"7":23,"8":24,"9":25,":":26,";":27,"<":28,"=":29,">":30,"?":31,"@":32,"A":33,"B":34,"C":35,"D":36,"E":37,"F":38,"G":39,"H":40,"I":41,"J":42,"K":43,"L":44,"M":45,"N":46,"O":47,"P":48,"Q":49,"R":50,"S":51,"T":52,"U":53,"V":54,"W":55,"X":56,"Y":57,"Z":58,"[":59,"\\":60,"]":61,"^":62,"_":63,"`":64,"a":65,"b":66,"c":67,"d":68,"e":69,"f":70,"g":71,"h":72,"i":73,"j":74,"k":75,"l":76,"m":77,"n":78,"o":79,"p":80,"q":81,"r":82,"s":83,"t":84,"u":85,"v":86,"w":87,"x":88,"y":89,"z":90,"{":91,"|":92,"}":93,"~":94,"¡":95,"¢":96,"£":97,"¤":98,"¥":99,"¦":100,"§":101,"¨":102,"©":103,"ª":104,"«":105,"¬":106,"®":107,"¯":108,"°":109,"±":110,"²":111,"³":112,"´":113,"µ":114,"¶":115,"·":116,"¸":117,"¹":118,"º":119,"»":120,"¼":121,"½":122,"¾":123,"¿":124,"À":125,"Á":126,"Â":127,"Ã":128,"Ä":129,"Å":130,"Æ":131,"Ç":132,"È":133,"É":134,"Ê":135,"Ë":136,"Ì":137,"Í":138,"Î":139,"Ï":140,"Ð":141,"Ñ":142,"Ò":143,"Ó":144,"Ô":145,"Õ":146,"Ö":147,"×":148,"Ø":149,"Ù":150,"Ú":151,"Û":152,"Ü":153,"Ý":154,"Þ":155,"ß":156,"à":157,"á":158,"â":159,"ã":160,"ä":161,"å":162,"æ":163,"ç":164,"è":165,"é":166,"ê":167,"ë":168,"ì":169,"í":170,"î":171,"ï":172,"ð":173,"ñ":174,"ò":175,"ó":176,"ô":177,"õ":178,"ö":179,"÷":180,"ø":181,"ù":182,"ú":183,"û":184,"ü":185,"ý":186,"þ":187,"ÿ":188,"Ā":189,"ā":190,"Ă":191,"ă":192,"Ą":193,"ą":194,"Ć":195,"ć":196,"Ĉ":197,"ĉ":198,"Ċ":199,"ċ":200,"Č":201,"č":202,"Ď":203,"ď":204,"Đ":205,"đ":206,"Ē":207,"ē":208,"Ĕ":209,"ĕ":210,"Ė":211,"ė":212,"Ę":213,"ę":214,"Ě":215,"ě":216,"Ĝ":217,"ĝ":218,"Ğ":219,"ğ":220,"Ġ":221,"ġ":222,"Ģ":223,"ģ":224,"Ĥ":225,"ĥ":226,"Ħ":227,"ħ":228,"Ĩ":229,"ĩ":230,"Ī":231,"ī":232,"Ĭ":233,"ĭ":234,"Į":235,"į":236,"İ":237,"ı":238,"Ĳ":239,"ĳ":240,"Ĵ":241,"ĵ":242,"Ķ":243,"ķ":244,"ĸ":245,"Ĺ":246,"ĺ":247,"Ļ":248,"ļ":249,"Ľ":250,"ľ":251,"Ŀ":252,"ŀ":253,"Ł":254,"ł":255,"Ń":256,"en":257,"fr":258}
\ No newline at end of file
diff --git a/synth_translation.py b/synth_translation.py
index 5d2546ae8bd36ecd7eceb891f376f71731c0e9ab..b1701309eba209b877f1c0f3a59a673464322e1a 100644
--- a/synth_translation.py
+++ b/synth_translation.py
@@ -1,6 +1,6 @@
 import transformers
 import numpy as np
-from datasets import load_dataset
+from datasets import load_dataset, DatasetDict
 from transformers import AutoModelForSeq2SeqLM
 from transformers import AutoTokenizer
 from transformers import DataCollatorForSeq2Seq
@@ -17,13 +17,24 @@ from huggingface_hub import Repository, get_full_repo_name
 from tqdm.auto import tqdm
 import torch
 from torch import Tensor
+import os
 
 #load in dataset, setup tokenizer
 
+def addperiod(entry):  # callback for Dataset.map() below; called with one example (no batched=True)
+    entry['en'] += '.'  # terminate the 'en' text with a period
+    entry['fr'] += '.'  # same for 'fr' (NOTE(review): dataset is eng-nah, so 'fr' presumably holds the target side -- confirm)
+    return entry  # hand the modified example back to map()
+
 raw_datasets = load_dataset("aatherton2024/eng-nah-svo")
+train_ds = raw_datasets['train'].map(addperiod)  # run addperiod over every example of each split
+validation_ds = raw_datasets['validation'].map(addperiod)
+test_ds = raw_datasets['test'].map(addperiod)
+
+raw_datasets = DatasetDict({"train" : train_ds, "validation" : validation_ds, "test" : test_ds})  # rebind so the code below sees the mapped splits
 model_checkpoint = "eng-nah-svo-cpt"
 
-if True:
+if False: #one-off setup: this branch saves the tokenizer as "eng-nah-svo-cpt" and pushes it to the hub, so it only needs to run once
     def get_training_corpus(raw_datasets):
         return (
             raw_datasets["train"][i : i + 1000]
@@ -37,10 +48,9 @@ if True:
     tokenizer.save_pretrained("eng-nah-svo-cpt")
     tokenizer.push_to_hub("eng-nah-svo-cpt")
 
+max_length = 128
 tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
 tokenizer.add_special_tokens({'pad_token': '[PAD]'})
-#contants
-max_length = 128
 
 #scan dataset, storing lists of english and french words then returning the tokenization of them
 def preprocess_function(examples):
@@ -55,26 +65,27 @@ def preprocess_function(examples):
 tokenized_datasets = raw_datasets.map(
     preprocess_function,
     batched=True,
-    remove_columns=raw_datasets["train"].column_names,
+    remove_columns=raw_datasets["train"].column_names
 )
 
 # #model choice for this problem
-if False:
-    model = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint)
+if False: #load pretrained model (NOTE(review): the else branch loads this same "eng-nah-svo-translation" checkpoint, so the toggle currently changes nothing)
+    model = AutoModelForSeq2SeqLM.from_pretrained("eng-nah-svo-translation")
 
 else:
     from transformers import BertConfig, BertLMHeadModel
     from transformers import AutoModel
 
     model = AutoModelForSeq2SeqLM.from_pretrained("eng-nah-svo-translation")
-    print(model)
-    #model = AutoModelForSeq2SeqLM.from_pretrained("Helsinki-NLP/opus-mt-en-fr")
+
+
 
 #data collator takes tokenizer and the model to deal with padding for dynamic batching
 data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)
 
 #Using BLEU as our metric for this problem
-metric = evaluate.load("sacrebleu")
+metric_bleu = evaluate.load("sacrebleu")  # its "score" is returned as "bleu" by compute_metrics
+metric_chrf = evaluate.load("chrf")  # its "score" is returned as "chrf" by compute_metrics
 
 #simple method to return test metrics
 def compute_metrics(eval_preds):
@@ -93,8 +104,9 @@ def compute_metrics(eval_preds):
     decoded_preds = [pred.strip() for pred in decoded_preds]
     decoded_labels = [[label.strip()] for label in decoded_labels]
 
-    result = metric.compute(predictions=decoded_preds, references=decoded_labels)
-    return {"bleu": result["score"]}
+    result_bleu = metric_bleu.compute(predictions=decoded_preds, references=decoded_labels)
+    result_chrf = metric_chrf.compute(predictions=decoded_preds, references=decoded_labels)
+    return {"bleu": result_bleu["score"], "chrf": result_chrf["score"]}
 
 ### We now enter the fine-tuning phase of our model structure ###
 
@@ -133,7 +145,8 @@ trainer.train()
 print("evaluate 2")
 print(trainer.evaluate(max_length=max_length))
 trainer.push_to_hub(tags="translation", commit_message="Training complete")
-
+print("training model now")
+model.train()  # NOTE(review): train() only switches the module to training mode; no optimisation runs here, and `model` is re-loaded from the checkpoint further down
 
 
 tokenized_datasets.set_format("torch")
@@ -144,7 +157,7 @@ train_dataloader = DataLoader(
     batch_size=8,
 )
 eval_dataloader = DataLoader(
-    tokenized_datasets["test"], collate_fn=data_collator, batch_size=8
+    tokenized_datasets["test"], collate_fn=data_collator, batch_size=8, drop_last=True  # NOTE(review): drop_last=True discards a final partial batch, so up to 7 test examples are never scored
 )
 
 model = AutoModelForSeq2SeqLM.from_pretrained("eng-nah-svo-translation")
@@ -197,63 +210,63 @@ def postprocess(predictions, labels):
 
 
 
-progress_bar = tqdm(range(num_training_steps))
-
-for epoch in range(num_train_epochs):
-    # Training
-    model.train()
-    for batch in train_dataloader:
-        outputs = model(**batch)
-        loss = outputs.loss
-        accelerator.backward(loss)
-
-        optimizer.step()
-        lr_scheduler.step()
-        optimizer.zero_grad()
-        progress_bar.update(1)
-
-    # Evaluation
-    model.eval()
-    for batch in tqdm(eval_dataloader):
-        with torch.no_grad():
-            generated_tokens = accelerator.unwrap_model(model).generate(
-                batch["input_ids"],
-                attention_mask=batch["attention_mask"],
-                max_length=128,
-            )
-        labels = batch["labels"]
-
-        # Necessary to pad predictions and labels for being gathered
-        generated_tokens = accelerator.pad_across_processes(
-            generated_tokens, dim=1, pad_index=tokenizer.pad_token_id
-        )
-        labels = accelerator.pad_across_processes(labels, dim=1, pad_index=-100)
+# progress_bar = tqdm(range(num_training_steps))
 
-        predictions_gathered = accelerator.gather(generated_tokens)
-        labels_gathered = accelerator.gather(labels)
+# for epoch in range(num_train_epochs):
+#     # Training
+#     model.train()
+#     for batch in train_dataloader:
+#         outputs = model(**batch)
+#         loss = outputs.loss
+#         accelerator.backward(loss)
 
-        decoded_preds, decoded_labels = postprocess(predictions_gathered, labels_gathered)
-        metric.add_batch(predictions=decoded_preds, references=decoded_labels)
+#         optimizer.step()
+#         lr_scheduler.step()
+#         optimizer.zero_grad()
+#         progress_bar.update(1)
 
-    results = metric.compute()
-    print(f"epoch {epoch}, BLEU score: {results['score']:.2f}")
+#     # Evaluation
+#     model.eval()
+#     for batch in tqdm(eval_dataloader):
+#         with torch.no_grad():
+#             generated_tokens = accelerator.unwrap_model(model).generate(
+#                 batch["input_ids"],
+#                 attention_mask=batch["attention_mask"],
+#                 max_length=128,
+#             )
+#         labels = batch["labels"]
 
-    # Save and upload
-    accelerator.wait_for_everyone()
-    unwrapped_model = accelerator.unwrap_model(model)
-    unwrapped_model.save_pretrained(output_dir, save_function=accelerator.save)
-    if accelerator.is_main_process:
-        tokenizer.save_pretrained(output_dir)
-        repo.push_to_hub(
-            commit_message=f"Training in progress epoch {epoch}", blocking=False
-        )
+#         # Necessary to pad predictions and labels for being gathered
+#         generated_tokens = accelerator.pad_across_processes(
+#             generated_tokens, dim=1, pad_index=tokenizer.pad_token_id
+#         )
+#         labels = accelerator.pad_across_processes(labels, dim=1, pad_index=-100)
+
+#         predictions_gathered = accelerator.gather(generated_tokens)
+#         labels_gathered = accelerator.gather(labels)
+
+#         decoded_preds, decoded_labels = postprocess(predictions_gathered, labels_gathered)
+#         metric_bleu.add_batch(predictions=decoded_preds, references=decoded_labels)
+
+#     results = metric_bleu.compute()
+#     print(f"epoch {epoch}, BLEU score: {results['score']:.2f}")
+
+#     # Save and upload
+#     accelerator.wait_for_everyone()
+#     unwrapped_model = accelerator.unwrap_model(model)
+#     unwrapped_model.save_pretrained(output_dir, save_function=accelerator.save)
+#     if accelerator.is_main_process:
+#         tokenizer.save_pretrained(output_dir)
+#         repo.push_to_hub(
+#             commit_message=f"Training in progress epoch {epoch}", blocking=False
+#         )
 
 
 
 # Replace this with your own checkpoint
-model_checkpoint = "aatherton2024/hf_eng_fra_reproduction"
+model_checkpoint = "aatherton2024/eng-nah-svo-translation"
 translator = pipeline("translation", model=model_checkpoint)
 translator("Default to expanded threads")
-translator(
-    "Unable to import %1 using the OFX importer plugin. This file is not the correct format."
-)
\ No newline at end of file
+print(translator(
+    "you did not frichopize him"
+))
\ No newline at end of file