update
Browse files
README.md
CHANGED
@@ -44,6 +44,26 @@ The copyright of the datasets belongs to the Institute of Linguistics, Academia
|
|
44 |
```python
|
45 |
>>> from transformers import pipeline
|
46 |
>>> unmasker = pipeline('fill-mask', model='ckiplab/oldhan-bert-base-chinese')
|
47 |
-
>>> unmasker("
|
48 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
49 |
```
|
|
|
44 |
```python
|
45 |
>>> from transformers import pipeline
|
46 |
>>> unmasker = pipeline('fill-mask', model='ckiplab/oldhan-bert-base-chinese')
|
47 |
+
>>> unmasker("黎[MASK]於變時雍。")
|
48 |
|
49 |
+
[{'sequence': '黎 民 於 變 時 雍 。',
|
50 |
+
'score': 0.14885780215263367,
|
51 |
+
'token': 3696,
|
52 |
+
'token_str': '民'},
|
53 |
+
{'sequence': '黎 庶 於 變 時 雍 。',
|
54 |
+
'score': 0.0859643816947937,
|
55 |
+
'token': 2433,
|
56 |
+
'token_str': '庶'},
|
57 |
+
{'sequence': '黎 氏 於 變 時 雍 。',
|
58 |
+
'score': 0.027848130092024803,
|
59 |
+
'token': 3694,
|
60 |
+
'token_str': '氏'},
|
61 |
+
{'sequence': '黎 人 於 變 時 雍 。',
|
62 |
+
'score': 0.023678112775087357,
|
63 |
+
'token': 782,
|
64 |
+
'token_str': '人'},
|
65 |
+
{'sequence': '黎 生 於 變 時 雍 。',
|
66 |
+
'score': 0.018718384206295013,
|
67 |
+
'token': 4495,
|
68 |
+
'token_str': '生'}]
|
69 |
```
|