{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 44, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "Sequence", "normalizers": [ { "type": "Lowercase" }, { "type": "Replace", "pattern": { "Regex": "[^\u00eez\\-\u00f9u\u00fby\u00e8xqcg\u00f4\u00ea_eidbaf\u0153hr\u00e9ksv\u00e0 \u2013p\u00ebtnoj\u00fc\u00e2\u00e7\u00ef'ml]" }, "content": "" }, { "type": "Strip", "strip_left": true, "strip_right": true }, { "type": "Replace", "pattern": { "Regex": "(?=.)|(?": 44 } } }