historical-irish-tokenizer-wordpiece / tokenizer_config.json
ancatmara's picture
Upload 3 files
a20b2c8 verified
raw
history blame contribute delete
235 Bytes
{
  "clean_up_tokenization_spaces": true,
  "model_max_length": 64,
  "special_tokens": [
    "<s>",
    "<pad>",
    "</s>",
    "<unk>",
    "<mask>",
    "<true>",
    "<false>"
  ],
  "tokenizer_class": "PreTrainedTokenizerFast"
}