Vedx04 committed on
Commit
94ca911
·
verified ·
1 Parent(s): 4080de0

Upload tokenizer

Browse files
Files changed (3) hide show
  1. tokenizer.json +0 -0
  2. tokenizer.model +2 -2
  3. tokenizer_config.json +2 -1
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
- size 499723
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
tokenizer_config.json CHANGED
@@ -28,10 +28,11 @@
28
  "special": true
29
  }
30
  },
 
31
  "bos_token": "<s>",
32
  "clean_up_tokenization_spaces": false,
33
  "eos_token": "</s>",
34
- "legacy": false,
35
  "model_max_length": 1000000000000000019884624838656,
36
  "pad_token": "</s>",
37
  "padding_side": "left",
 
28
  "special": true
29
  }
30
  },
31
+ "additional_special_tokens": [],
32
  "bos_token": "<s>",
33
  "clean_up_tokenization_spaces": false,
34
  "eos_token": "</s>",
35
+ "legacy": true,
36
  "model_max_length": 1000000000000000019884624838656,
37
  "pad_token": "</s>",
38
  "padding_side": "left",