Upload tokenizer
Browse files- tokenizer.json +6 -4
tokenizer.json
CHANGED
@@ -2,13 +2,13 @@
|
|
2 |
"version": "1.0",
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
-
"max_length":
|
6 |
"strategy": "LongestFirst",
|
7 |
"stride": 0
|
8 |
},
|
9 |
"padding": {
|
10 |
"strategy": {
|
11 |
-
"Fixed":
|
12 |
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
@@ -90,7 +90,8 @@
|
|
90 |
{
|
91 |
"type": "Metaspace",
|
92 |
"replacement": "▁",
|
93 |
-
"
|
|
|
94 |
}
|
95 |
]
|
96 |
},
|
@@ -172,7 +173,8 @@
|
|
172 |
"decoder": {
|
173 |
"type": "Metaspace",
|
174 |
"replacement": "▁",
|
175 |
-
"
|
|
|
176 |
},
|
177 |
"model": {
|
178 |
"type": "Unigram",
|
|
|
2 |
"version": "1.0",
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
+
"max_length": 1680,
|
6 |
"strategy": "LongestFirst",
|
7 |
"stride": 0
|
8 |
},
|
9 |
"padding": {
|
10 |
"strategy": {
|
11 |
+
"Fixed": 1680
|
12 |
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
|
|
90 |
{
|
91 |
"type": "Metaspace",
|
92 |
"replacement": "▁",
|
93 |
+
"prepend_scheme": "always",
|
94 |
+
"split": true
|
95 |
}
|
96 |
]
|
97 |
},
|
|
|
173 |
"decoder": {
|
174 |
"type": "Metaspace",
|
175 |
"replacement": "▁",
|
176 |
+
"prepend_scheme": "always",
|
177 |
+
"split": true
|
178 |
},
|
179 |
"model": {
|
180 |
"type": "Unigram",
|