{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 72, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "Lowercase" }, { "type": "Replace", "pattern": { "Regex": "[^\u092b41\\-\u0905\u09078 0\u091b\u0928\u090f\u0910\u093c\u0937\u093f\u0901\u091a2\u0911\u0925\u092d\u0940\u200d\u09453\u091e\u0948\u0941\u0920\u0902\u0949\u0909_\u0908\u0903\u0939\u0927\u0932\u0930\u0938\u092c\u0916\u0923'`\u0935\u0918\u092a\u0917\u0922\u092f\u0947\u094d\u093e\u0906\u0921\u091c\u091d\u0936\u0914\u094b\u0926\u0943\u094c\u090a\u0942\u0913\u091f\u0924\u0915\u092e]" }, "content": "" }, { "type": "Strip", "strip_left": true, "strip_right": true }, { "type": "Replace", "pattern": { "Regex": "(?=.)|(?": 72 } } }