beamaia committed on
Commit
3955f28
1 Parent(s): 757943f

Upload tokenizer

Browse files
Files changed (1) hide show
  1. tokenizer.json +28 -6
tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 2048,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
@@ -76,6 +71,12 @@
76
  "id": "A",
77
  "type_id": 0
78
  }
 
 
 
 
 
 
79
  }
80
  ],
81
  "pair": [
@@ -91,6 +92,12 @@
91
  "type_id": 0
92
  }
93
  },
 
 
 
 
 
 
94
  {
95
  "SpecialToken": {
96
  "id": "<s>",
@@ -102,9 +109,24 @@
102
  "id": "B",
103
  "type_id": 1
104
  }
 
 
 
 
 
 
105
  }
106
  ],
107
  "special_tokens": {
 
 
 
 
 
 
 
 
 
108
  "<s>": {
109
  "id": "<s>",
110
  "ids": [
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
71
  "id": "A",
72
  "type_id": 0
73
  }
74
+ },
75
+ {
76
+ "SpecialToken": {
77
+ "id": "</s>",
78
+ "type_id": 0
79
+ }
80
  }
81
  ],
82
  "pair": [
 
92
  "type_id": 0
93
  }
94
  },
95
+ {
96
+ "SpecialToken": {
97
+ "id": "</s>",
98
+ "type_id": 0
99
+ }
100
+ },
101
  {
102
  "SpecialToken": {
103
  "id": "<s>",
 
109
  "id": "B",
110
  "type_id": 1
111
  }
112
+ },
113
+ {
114
+ "SpecialToken": {
115
+ "id": "</s>",
116
+ "type_id": 1
117
+ }
118
  }
119
  ],
120
  "special_tokens": {
121
+ "</s>": {
122
+ "id": "</s>",
123
+ "ids": [
124
+ 2
125
+ ],
126
+ "tokens": [
127
+ "</s>"
128
+ ]
129
+ },
130
  "<s>": {
131
  "id": "<s>",
132
  "ids": [