{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 43, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "Lowercase" }, { "type": "Replace", "pattern": { "Regex": "[^|n\u00ed\u1ecdi\u00e0\u1eb9tarb\u00ecw\u0301l\u0300k\u00e1s\u00faogmy\u00f3puej\u00f2f\u1e63\u00e9d\u00e8\u00f9\u0144h\\-\u01f9\u2014' ]" }, "content": "" }, { "type": "Strip", "strip_left": true, "strip_right": true }, { "type": "Replace", "pattern": { "Regex": "(?=.)|(?": 43 } } }