jinymusim committed
Commit: f70c703 · Parent: 69016e3

Upload 8 files


New model with a token limit of 1024

Files changed (4)
  1. merges.txt +1 -1
  2. pytorch_model.bin +1 -1
  3. tokenizer.json +7 -1
  4. tokenizer_config.json +1 -1
merges.txt CHANGED
@@ -1,4 +1,4 @@
-#version: 0.2 - Trained by `huggingface/tokenizers`
+#version: 0.2
 Ã Ń
 Ã ¡
 Ġ p
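Only the `#version` header comment changes here; the merge pairs themselves are untouched. Entries such as "Ã Ń", "Ã ¡", and "Ġ p" are not mojibake but byte-level BPE pairs written with GPT-2's byte-to-unicode mapping. A minimal sketch, assuming this tokenizer uses that standard mapping (the merges format and `<|endoftext|>` token suggest it, but this is an assumption), decodes a pair back to readable UTF-8:

# Minimal sketch, assuming the standard GPT-2 byte-to-unicode mapping applies.
from transformers.models.gpt2.tokenization_gpt2 import bytes_to_unicode

# Invert the byte -> printable-character map used by byte-level BPE merges files.
byte_decoder = {char: byte for byte, char in bytes_to_unicode().items()}

def decode_merge(pair: str) -> str:
    left, right = pair.split(" ")
    raw = bytes(byte_decoder[ch] for ch in left + right)
    return raw.decode("utf-8", errors="replace")

print(decode_merge("Ã Ń"))  # "í"
print(decode_merge("Ã ¡"))  # "á"
print(decode_merge("Ġ p"))  # " p" (Ġ marks a leading space)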
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ae6532129654abe85ad03f722bd48af118bebd5d733e6d8b910d9c6d0086b12f
+oid sha256:32a567f19d1007dfde526c36eeb570acc2ac2bc49adb8e630d2257dad8c6b2a2
 size 510398013
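This file is a Git LFS pointer, so the diff only swaps the SHA-256 of the new weights; the reported size is unchanged. As a minimal sketch, a locally downloaded pytorch_model.bin (path assumed to be the repo root) can be checked against the new oid, since the oid is the SHA-256 of the file contents:

# Minimal sketch: verify a downloaded pytorch_model.bin against the LFS pointer hash.
import hashlib

EXPECTED = "32a567f19d1007dfde526c36eeb570acc2ac2bc49adb8e630d2257dad8c6b2a2"

sha = hashlib.sha256()
with open("pytorch_model.bin", "rb") as f:  # assumes the file sits in the repo root
    for chunk in iter(lambda: f.read(1 << 20), b""):
        sha.update(chunk)

print(sha.hexdigest() == EXPECTED)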
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
 {
   "version": "1.0",
-  "truncation": null,
+  "truncation": {
+    "direction": "Right",
+    "max_length": 1024,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
   "padding": null,
   "added_tokens": [
     {
@@ -39,6 +44,7 @@
   "continuing_subword_prefix": "",
   "end_of_word_suffix": "",
   "fuse_unk": false,
+  "byte_fallback": false,
   "vocab": {
     "<|endoftext|>": 0,
     "!": 1,
tokenizer_config.json CHANGED
@@ -18,7 +18,7 @@
     "single_word": false
   },
   "errors": "replace",
-  "model_max_length": 512,
+  "model_max_length": 1024,
   "pad_token": {
     "__type": "AddedToken",
     "content": "<|endoftext|>",