{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 53, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "Lowercase" }, { "type": "Replace", "pattern": { "Regex": "[^_ abcdefghijklmnopqrstuwxyz\u00e0\u00e1\u00e8\u00e9\u00ec\u00ed\u00f2\u00f3\u00f9\u00fa\u00fc\u0101\u0113\u011b\u012b\u0144\u014d\u016b\u01ce\u01d0\u01d2\u01d4\u01d8\u01da\u01dc\u1e3f]" }, "content": "" }, { "type": "Strip", "strip_left": true, "strip_right": true }, { "type": "Replace", "pattern": { "Regex": "(?=.)|(?": 53 } } }