{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 60, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "Lowercase" }, { "type": "Replace", "pattern": { "Regex": "[^|\u0abe\u0ac7\u0aa4\u0aa8\u0ab0\u0acd\u0aae\u0ac0\u0a95\u0a82\u0acb\u0aaa\u0ab5\u0ac1\u0ab8\u0aaf\u0ab9\u0a9c\u0aa5\u0abf\u0ab6\u0aa3\u0a9b\u0ab2\u0aa6\u0a86\u0a93\u0a85\u0a8f\u0a88\u0aac\u0a97\u0a96\u0aa7\u0aad\u0a9f\u0ab3\u0ac2\u0a9a\u0aa1\u0ab7\u0a89\u0aab\u0a98\u0aa0\u0ac3'\u0a8a\u0a87\u0a9e\u0a9d\u0aa2\u0ac8\u0a83\u0acc\\-\u0a8b\u0a90 ]" }, "content": "" }, { "type": "Strip", "strip_left": true, "strip_right": true }, { "type": "Replace", "pattern": { "Regex": "(?=.)|(?": 60 } } }