End of training
Browse files- tokenizer.json +101 -2
tokenizer.json
CHANGED
@@ -2,13 +2,13 @@
|
|
2 |
"version": "1.0",
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
-
"max_length":
|
6 |
"strategy": "LongestFirst",
|
7 |
"stride": 0
|
8 |
},
|
9 |
"padding": {
|
10 |
"strategy": {
|
11 |
-
"Fixed":
|
12 |
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
@@ -943,6 +943,105 @@
|
|
943 |
"rstrip": false,
|
944 |
"normalized": false,
|
945 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
946 |
}
|
947 |
],
|
948 |
"normalizer": {
|
|
|
2 |
"version": "1.0",
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
+
"max_length": 64,
|
6 |
"strategy": "LongestFirst",
|
7 |
"stride": 0
|
8 |
},
|
9 |
"padding": {
|
10 |
"strategy": {
|
11 |
+
"Fixed": 64
|
12 |
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
|
|
943 |
"rstrip": false,
|
944 |
"normalized": false,
|
945 |
"special": true
|
946 |
+
},
|
947 |
+
{
|
948 |
+
"id": 32100,
|
949 |
+
"content": "<question>",
|
950 |
+
"single_word": false,
|
951 |
+
"lstrip": false,
|
952 |
+
"rstrip": false,
|
953 |
+
"normalized": true,
|
954 |
+
"special": false
|
955 |
+
},
|
956 |
+
{
|
957 |
+
"id": 32101,
|
958 |
+
"content": "<\\question>",
|
959 |
+
"single_word": false,
|
960 |
+
"lstrip": false,
|
961 |
+
"rstrip": false,
|
962 |
+
"normalized": true,
|
963 |
+
"special": false
|
964 |
+
},
|
965 |
+
{
|
966 |
+
"id": 32102,
|
967 |
+
"content": "<database>",
|
968 |
+
"single_word": false,
|
969 |
+
"lstrip": false,
|
970 |
+
"rstrip": false,
|
971 |
+
"normalized": true,
|
972 |
+
"special": false
|
973 |
+
},
|
974 |
+
{
|
975 |
+
"id": 32103,
|
976 |
+
"content": "<table>",
|
977 |
+
"single_word": false,
|
978 |
+
"lstrip": false,
|
979 |
+
"rstrip": false,
|
980 |
+
"normalized": true,
|
981 |
+
"special": false
|
982 |
+
},
|
983 |
+
{
|
984 |
+
"id": 32104,
|
985 |
+
"content": "<column>",
|
986 |
+
"single_word": false,
|
987 |
+
"lstrip": false,
|
988 |
+
"rstrip": false,
|
989 |
+
"normalized": true,
|
990 |
+
"special": false
|
991 |
+
},
|
992 |
+
{
|
993 |
+
"id": 32105,
|
994 |
+
"content": "<\\database> ",
|
995 |
+
"single_word": false,
|
996 |
+
"lstrip": false,
|
997 |
+
"rstrip": false,
|
998 |
+
"normalized": true,
|
999 |
+
"special": false
|
1000 |
+
},
|
1001 |
+
{
|
1002 |
+
"id": 32106,
|
1003 |
+
"content": "<\table>",
|
1004 |
+
"single_word": false,
|
1005 |
+
"lstrip": false,
|
1006 |
+
"rstrip": false,
|
1007 |
+
"normalized": true,
|
1008 |
+
"special": false
|
1009 |
+
},
|
1010 |
+
{
|
1011 |
+
"id": 32107,
|
1012 |
+
"content": "</non-join>",
|
1013 |
+
"single_word": false,
|
1014 |
+
"lstrip": false,
|
1015 |
+
"rstrip": false,
|
1016 |
+
"normalized": true,
|
1017 |
+
"special": false
|
1018 |
+
},
|
1019 |
+
{
|
1020 |
+
"id": 32108,
|
1021 |
+
"content": "<non-join>",
|
1022 |
+
"single_word": false,
|
1023 |
+
"lstrip": false,
|
1024 |
+
"rstrip": false,
|
1025 |
+
"normalized": true,
|
1026 |
+
"special": false
|
1027 |
+
},
|
1028 |
+
{
|
1029 |
+
"id": 32109,
|
1030 |
+
"content": "</join>",
|
1031 |
+
"single_word": false,
|
1032 |
+
"lstrip": false,
|
1033 |
+
"rstrip": false,
|
1034 |
+
"normalized": true,
|
1035 |
+
"special": false
|
1036 |
+
},
|
1037 |
+
{
|
1038 |
+
"id": 32110,
|
1039 |
+
"content": "<join>",
|
1040 |
+
"single_word": false,
|
1041 |
+
"lstrip": false,
|
1042 |
+
"rstrip": false,
|
1043 |
+
"normalized": true,
|
1044 |
+
"special": false
|
1045 |
}
|
1046 |
],
|
1047 |
"normalizer": {
|