Phương committed on
Commit
ec4e187
·
1 Parent(s): 3b746d6

Upload tokenizer_config(1).json

Browse files
Files changed (1) hide show
  1. tokenizer_config(1).json +12 -0
tokenizer_config(1).json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<start>",
3
+ "clean_up_tokenization_spaces": true,
4
+ "eos_token": "<end>",
5
+ "model_input_names": [
6
+ "input_ids"
7
+ ],
8
+ "model_max_length": 1000000000000000019884624838656,
9
+ "pad_token": "<pad>",
10
+ "tokenizer_class": "PreTrainedTokenizerFast",
11
+ "unk_token": "<pad>"
12
+ }