fix post_processor ids
Browse files- tokenizer.json +4 -4
tokenizer.json
CHANGED
@@ -104,12 +104,12 @@
|
|
104 |
"post_processor": {
|
105 |
"type": "RobertaProcessing",
|
106 |
"sep": [
|
107 |
-
"
|
108 |
-
|
109 |
],
|
110 |
"cls": [
|
111 |
-
"<
|
112 |
-
|
113 |
],
|
114 |
"trim_offsets": true,
|
115 |
"add_prefix_space": false
|
|
|
104 |
"post_processor": {
|
105 |
"type": "RobertaProcessing",
|
106 |
"sep": [
|
107 |
+
"<EOT>",
|
108 |
+
0
|
109 |
],
|
110 |
"cls": [
|
111 |
+
"<bos>",
|
112 |
+
65002
|
113 |
],
|
114 |
"trim_offsets": true,
|
115 |
"add_prefix_space": false
|