cased model
Browse files
- added_tokens.json +0 -1
- config.json +1 -1
- flax_model.msgpack +2 -2
- tokenizer.json +0 -0
- tokenizer_config.json +1 -1
- vocab.txt +0 -0
added_tokens.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"</s>": 50136, "<s>": 50135}
|
|
|
|
config.json
CHANGED
@@ -23,5 +23,5 @@
|
|
23 |
"tie_word_embeddings": false,
|
24 |
"transformers_version": "4.16.2",
|
25 |
"use_cache": true,
|
26 |
-
"vocab_size":
|
27 |
}
|
|
|
23 |
"tie_word_embeddings": false,
|
24 |
"transformers_version": "4.16.2",
|
25 |
"use_cache": true,
|
26 |
+
"vocab_size": 54343
|
27 |
}
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba8690145741abefa5160a5918228bbb0058494b83d5daa5a4101f1d4a0555cf
|
3 |
+
size 1126812575
|
tokenizer.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "do_basic_tokenize": true, "never_split": null, "
|
|
|
1 |
+
{"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "do_basic_tokenize": true, "never_split": null, "special_tokens_map_file": "KcT5-base-cased/special_tokens_map.json", "name_or_path": "KcT5-base-cased", "tokenizer_class": "BertTokenizer"}
|
vocab.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|