beomi committed on
Commit
41e857a
1 Parent(s): 06e3fed

cased model

Browse files
added_tokens.json DELETED
@@ -1 +0,0 @@
1
- {"</s>": 50136, "<s>": 50135}
 
 
config.json CHANGED
@@ -23,5 +23,5 @@
23
  "tie_word_embeddings": false,
24
  "transformers_version": "4.16.2",
25
  "use_cache": true,
26
- "vocab_size": 50137
27
  }
 
23
  "tie_word_embeddings": false,
24
  "transformers_version": "4.16.2",
25
  "use_cache": true,
26
+ "vocab_size": 54343
27
  }
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c767ae78a06b8f8fee6505d22f317dacd20d395190ae11fc77059ce887fc1be
3
- size 1100970911
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba8690145741abefa5160a5918228bbb0058494b83d5daa5a4101f1d4a0555cf
3
+ size 1126812575
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "do_basic_tokenize": true, "never_split": null, "model_max_length": 512, "special_tokens_map_file": "/home/beomi/.cache/huggingface/transformers/6bddca875f34b8afbae26136b9594ea80793c9598640f0bc94017555a0a1c113.31b83c6ab34462cefd974ed0df8dd4189e7b7b81b47315b7a10627f7ae120002", "name_or_path": "./KcT5-base", "tokenizer_class": "BertTokenizer"}
 
1
+ {"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "do_basic_tokenize": true, "never_split": null, "special_tokens_map_file": "KcT5-base-cased/special_tokens_map.json", "name_or_path": "KcT5-base-cased", "tokenizer_class": "BertTokenizer"}
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff