Commit
•
8c7bdd1
1
Parent(s):
759ae03
Upload tokenizer.json
Browse files- tokenizer.json +12 -3
tokenizer.json
CHANGED
@@ -99,6 +99,15 @@
|
|
99 |
"tokens": [
|
100 |
"<s>"
|
101 |
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
102 |
}
|
103 |
}
|
104 |
},
|
@@ -129,11 +138,11 @@
|
|
129 |
"model": {
|
130 |
"type": "BPE",
|
131 |
"dropout": null,
|
132 |
-
"unk_token":
|
133 |
"continuing_subword_prefix": null,
|
134 |
"end_of_word_suffix": null,
|
135 |
-
"fuse_unk":
|
136 |
-
"byte_fallback":
|
137 |
"vocab": {
|
138 |
"<unk>": 0,
|
139 |
"<s>": 1,
|
|
|
99 |
"tokens": [
|
100 |
"<s>"
|
101 |
]
|
102 |
+
},
|
103 |
+
"</s>": {
|
104 |
+
"id": "</s>",
|
105 |
+
"ids": [
|
106 |
+
2
|
107 |
+
],
|
108 |
+
"tokens": [
|
109 |
+
"</s>"
|
110 |
+
]
|
111 |
}
|
112 |
}
|
113 |
},
|
|
|
138 |
"model": {
|
139 |
"type": "BPE",
|
140 |
"dropout": null,
|
141 |
+
"unk_token": null,
|
142 |
"continuing_subword_prefix": null,
|
143 |
"end_of_word_suffix": null,
|
144 |
+
"fuse_unk": false,
|
145 |
+
"byte_fallback": false,
|
146 |
"vocab": {
|
147 |
"<unk>": 0,
|
148 |
"<s>": 1,
|