codebyzeb committed on
Commit
792f6de
1 Parent(s): 19e859b

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +2 -2
  2. tokenizer_config.json +2 -2
tokenizer.json CHANGED
@@ -22,8 +22,8 @@
22
  "special": true
23
  },
24
  {
25
- "id": 31,
26
- "content": "<|endoftext|>",
27
  "single_word": false,
28
  "lstrip": false,
29
  "rstrip": false,
 
22
  "special": true
23
  },
24
  {
25
+ "id": 5,
26
+ "content": "UTT_BOUNDARY",
27
  "single_word": false,
28
  "lstrip": false,
29
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -17,8 +17,8 @@
17
  "single_word": false,
18
  "special": true
19
  },
20
- "31": {
21
- "content": "<|endoftext|>",
22
  "lstrip": false,
23
  "normalized": false,
24
  "rstrip": false,
 
17
  "single_word": false,
18
  "special": true
19
  },
20
+ "5": {
21
+ "content": "UTT_BOUNDARY",
22
  "lstrip": false,
23
  "normalized": false,
24
  "rstrip": false,