kochan13 committed on
Commit
7d44290
1 Parent(s): e5bb408

Upload 4 files

Browse files
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "</s|LLM-jp>"
4
+ ],
5
+ "bos_token": "<s|LLM-jp>",
6
+ "cls_token": "<CLS|LLM-jp>",
7
+ "eod_token": "<EOD|LLM-jp>",
8
+ "eos_token": "<EOD|LLM-jp>",
9
+ "mask_token": "<mask|LLM-jp>",
10
+ "pad_token": "<pad|LLM-jp>",
11
+ "sep_token": "<SEP|LLM-jp>",
12
+ "unk_token": "<unk|LLM-jp>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "unk_token": "<unk|LLM-jp>",
3
+ "bos_token": "<s|LLM-jp>",
4
+ "eos_token": "<EOD|LLM-jp>",
5
+ "pad_token": "<pad|LLM-jp>",
6
+ "cls_token": "<CLS|LLM-jp>",
7
+ "sep_token": "<SEP|LLM-jp>",
8
+ "eod_token": "<EOD|LLM-jp>",
9
+ "mask_token": "<mask|LLM-jp>",
10
+ "extra_ids": 0,
11
+ "additional_special_tokens": [
12
+ "</s|LLM-jp>"
13
+ ],
14
+ "sp_model_kwargs": {},
15
+ "model_max_length": 1000000000000000019884624838656,
16
+ "clean_up_tokenization_spaces": false,
17
+ "special_tokens_map_file": null,
18
+ "tokenizer_class": "PreTrainedTokenizerFast"
19
+ }