JustinLin610
committed on
Commit
•
e58a774
1
Parent(s):
535391d
Upload folder using huggingface_hub
Browse files
- tokenizer.json +33 -3
- tokenizer.model +2 -2
tokenizer.json
CHANGED
@@ -37,7 +37,7 @@
|
|
37 |
"lstrip": false,
|
38 |
"rstrip": false,
|
39 |
"normalized": false,
|
40 |
-
"special": false
|
41 |
},
|
42 |
{
|
43 |
"id": 4,
|
@@ -46,7 +46,7 @@
|
|
46 |
"lstrip": false,
|
47 |
"rstrip": false,
|
48 |
"normalized": false,
|
49 |
-
"special": false
|
50 |
},
|
51 |
{
|
52 |
"id": 5,
|
@@ -12512,6 +12512,33 @@
|
|
12512 |
"rstrip": false,
|
12513 |
"normalized": false,
|
12514 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12515 |
}
|
12516 |
],
|
12517 |
"normalizer": {
|
@@ -104857,7 +104884,10 @@
|
|
104857 |
"<fim_prefix>": 92295,
|
104858 |
"<fim_middle>": 92296,
|
104859 |
"<fim_suffix>": 92297,
|
104860 |
-
"<fim_pad>": 92298
|
|
|
|
|
|
|
104861 |
},
|
104862 |
"merges": [
|
104863 |
"▁ t",
|
|
|
37 |
"lstrip": false,
|
38 |
"rstrip": false,
|
39 |
"normalized": false,
|
40 |
+
"special": true
|
41 |
},
|
42 |
{
|
43 |
"id": 4,
|
|
|
46 |
"lstrip": false,
|
47 |
"rstrip": false,
|
48 |
"normalized": false,
|
49 |
+
"special": true
|
50 |
},
|
51 |
{
|
52 |
"id": 5,
|
|
|
12512 |
"rstrip": false,
|
12513 |
"normalized": false,
|
12514 |
"special": false
|
12515 |
+
},
|
12516 |
+
{
|
12517 |
+
"id": 92299,
|
12518 |
+
"content": "<repo_name>",
|
12519 |
+
"single_word": false,
|
12520 |
+
"lstrip": false,
|
12521 |
+
"rstrip": false,
|
12522 |
+
"normalized": false,
|
12523 |
+
"special": false
|
12524 |
+
},
|
12525 |
+
{
|
12526 |
+
"id": 92300,
|
12527 |
+
"content": "<file_sep>",
|
12528 |
+
"single_word": false,
|
12529 |
+
"lstrip": false,
|
12530 |
+
"rstrip": false,
|
12531 |
+
"normalized": false,
|
12532 |
+
"special": false
|
12533 |
+
},
|
12534 |
+
{
|
12535 |
+
"id": 92301,
|
12536 |
+
"content": "<|extra_0|>",
|
12537 |
+
"single_word": false,
|
12538 |
+
"lstrip": false,
|
12539 |
+
"rstrip": false,
|
12540 |
+
"normalized": false,
|
12541 |
+
"special": false
|
12542 |
}
|
12543 |
],
|
12544 |
"normalizer": {
|
|
|
104884 |
"<fim_prefix>": 92295,
|
104885 |
"<fim_middle>": 92296,
|
104886 |
"<fim_suffix>": 92297,
|
104887 |
+
"<fim_pad>": 92298,
|
104888 |
+
"<repo_name>": 92299,
|
104889 |
+
"<file_sep>": 92300,
|
104890 |
+
"<|extra_0|>": 92301
|
104891 |
},
|
104892 |
"merges": [
|
104893 |
"▁ t",
|
tokenizer.model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:656b66a920a54bc45e8e06dc587691ab3c0b2930b9ae56d5fa31e72db2f3bff3
|
3 |
+
size 1423961
|