KoichiYasuoka committed on
Commit
df69051
1 Parent(s): 0359194

常用漢字 support

Browse files
Files changed (1) hide show
  1. tokenizer.json +29 -1
tokenizer.json CHANGED
@@ -76,6 +76,34 @@
76
  "Regex": " {2,}"
77
  },
78
  "content": " "
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
  }
80
  ]
81
  },
@@ -128170,4 +128198,4 @@
128170
  ]
128171
  ]
128172
  }
128173
- }
76
  "Regex": " {2,}"
77
  },
78
  "content": " "
79
+ },
80
+ {
81
+ "type": "Replace",
82
+ "pattern": {
83
+ "String": "𠮟"
84
+ },
85
+ "content": "叱"
86
+ },
87
+ {
88
+ "type": "Replace",
89
+ "pattern": {
90
+ "String": "塡"
91
+ },
92
+ "content": "填"
93
+ },
94
+ {
95
+ "type": "Replace",
96
+ "pattern": {
97
+ "String": "剝"
98
+ },
99
+ "content": "剥"
100
+ },
101
+ {
102
+ "type": "Replace",
103
+ "pattern": {
104
+ "String": "頰"
105
+ },
106
+ "content": "頬"
107
  }
108
  ]
109
  },
128198
  ]
128199
  ]
128200
  }
128201
+ }