{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 34, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "Lowercase" }, { "type": "Replace", "pattern": { "String": "\u021b" }, "content": "\u0163" }, { "type": "Replace", "pattern": { "Regex": "[^cqubg_n\u2013mzitl\u0103f\u0219a1\u00eep\\-hs'xej\u00e2 rvo\u0163d]" }, "content": "" }, { "type": "Strip", "strip_left": true, "strip_right": true }, { "type": "Replace", "pattern": { "Regex": "(?=.)|(?": 34 } } }