deformer / tokenizer_config.json
Lauler's picture
DeFormer v2.0 de/dem/det/enda/ända support
df5efae
raw
history blame
612 Bytes
{
  "do_lower_case": false,
  "unk_token": "[UNK]",
  "sep_token": "[SEP]",
  "pad_token": "[PAD]",
  "cls_token": "[CLS]",
  "mask_token": "[MASK]",
  "tokenize_chinese_chars": true,
  "strip_accents": false,
  "special_tokens_map_file": null,
  "name_or_path": "KBLab/bert-base-swedish-cased",
  "do_basic_tokenize": true,
  "never_split": null,
  "tokenizer_class": "BertTokenizer",
  "model_max_length": 512
}