BengaliSentencePieceBPETokenizer / tokenizer_config.json
faisaltareque's picture
Upload tokenizer
198d4f4
raw
history blame contribute delete
433 Bytes
{
  "model_max_length": 1024,
  "name_or_path": "/home/shohan/Dev/PlayGround/BanglaTokenizer/BengaliSentencePieceBPETokenizerFast",
  "special_tokens": [
    "<s>",
    "<pad>",
    "</s>",
    "<unk>",
    "<cls>",
    "<sep>",
    "<mask>"
  ],
  "special_tokens_map_file": "/home/shohan/Dev/PlayGround/BanglaTokenizer/BengaliSentencePieceBPETokenizerFast/special_tokens_map.json",
  "tokenizer_class": "PreTrainedTokenizerFast"
}