{
  "added_tokens_decoder": {
    "0": {
      "content": "<pad>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<unk>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "[CLS]",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "3": {
      "content": "[SEP]",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "4": {
      "content": "[MASK]",
      "lstrip": true,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "5": {
      "content": "(",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "6": {
      "content": ")",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "7": {
      "content": "”",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "8": {
      "content": "\"",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "9": {
      "content": "-",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "10": {
      "content": ".",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "11": {
      "content": "–",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "12": {
      "content": "!",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "13": {
      "content": ":",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "14": {
      "content": "?",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "15": {
      "content": "/",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "16": {
      "content": ";",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "17": {
      "content": "'",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "18": {
      "content": "`",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "19": {
      "content": "[",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "20": {
      "content": "]",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "21": {
      "content": "£",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "22": {
      "content": "€",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "23": {
      "content": "$",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "24": {
      "content": "*",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "25": {
      "content": "%",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "26": {
      "content": "&",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "27": {
      "content": "=",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    },
    "28": {
      "content": "+",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": false
    }
  },
  "bos_token": "[CLS]",
  "clean_up_tokenization_spaces": false,
  "cls_token": "[CLS]",
  "do_lower_case": false,
  "eos_token": "[SEP]",
  "keep_accents": true,
  "mask_token": "[MASK]",
  "model_max_length": 512,
  "pad_token": "<pad>",
  "remove_space": true,
  "sep_token": "[SEP]",
  "sp_model_kwargs": {},
  "tokenizer_class": "AlbertTokenizer",
  "unk_token": "<unk>"
}
|