solotimes committed on
Commit
55e7392
0 Parent(s):
.gitattributes ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ftz filter=lfs diff=lfs merge=lfs -text
6
+ *.gz filter=lfs diff=lfs merge=lfs -text
7
+ *.h5 filter=lfs diff=lfs merge=lfs -text
8
+ *.joblib filter=lfs diff=lfs merge=lfs -text
9
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
10
+ *.model filter=lfs diff=lfs merge=lfs -text
11
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
12
+ *.npy filter=lfs diff=lfs merge=lfs -text
13
+ *.npz filter=lfs diff=lfs merge=lfs -text
14
+ *.onnx filter=lfs diff=lfs merge=lfs -text
15
+ *.ot filter=lfs diff=lfs merge=lfs -text
16
+ *.parquet filter=lfs diff=lfs merge=lfs -text
17
+ *.pb filter=lfs diff=lfs merge=lfs -text
18
+ *.pickle filter=lfs diff=lfs merge=lfs -text
19
+ *.pkl filter=lfs diff=lfs merge=lfs -text
20
+ *.pt filter=lfs diff=lfs merge=lfs -text
21
+ *.pth filter=lfs diff=lfs merge=lfs -text
22
+ *.rar filter=lfs diff=lfs merge=lfs -text
23
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
24
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
25
+ *.tflite filter=lfs diff=lfs merge=lfs -text
26
+ *.tgz filter=lfs diff=lfs merge=lfs -text
27
+ *.wasm filter=lfs diff=lfs merge=lfs -text
28
+ *.xz filter=lfs diff=lfs merge=lfs -text
29
+ *.zip filter=lfs diff=lfs merge=lfs -text
30
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
31
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ---
2
+ license: mit
3
+ ---
added_tokens.json ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<s_iitcdip>": 57523,
3
+ "<s_lavibe-base>": 57525,
4
+ "<s_synthdog>": 57524,
5
+ "<sep/>": 57522,
6
+ "伪": 57619,
7
+ "估": 57528,
8
+ "俞": 57598,
9
+ "债": 57610,
10
+ "偶": 57573,
11
+ "偿": 57541,
12
+ "兑": 57621,
13
+ "册": 57580,
14
+ "况": 57531,
15
+ "凤": 57609,
16
+ "刁": 57537,
17
+ "劝": 57590,
18
+ "匹": 57554,
19
+ "卸": 57568,
20
+ "厢": 57607,
21
+ "叉": 57577,
22
+ "吕": 57558,
23
+ "址": 57538,
24
+ "培": 57536,
25
+ "塘": 57605,
26
+ "够": 57587,
27
+ "央": 57546,
28
+ "姜": 57602,
29
+ "娟": 57601,
30
+ "娱": 57566,
31
+ "娶": 57542,
32
+ "婕": 57616,
33
+ "履": 57556,
34
+ "峡": 57603,
35
+ "崔": 57578,
36
+ "弃": 57595,
37
+ "弢": 57617,
38
+ "循": 57571,
39
+ "怖": 57560,
40
+ "怡": 57625,
41
+ "愁": 57608,
42
+ "披": 57526,
43
+ "担": 57593,
44
+ "摘": 57572,
45
+ "撑": 57592,
46
+ "擅": 57594,
47
+ "旦": 57549,
48
+ "旭": 57583,
49
+ "晰": 57618,
50
+ "朋": 57543,
51
+ "构": 57567,
52
+ "析": 57553,
53
+ "栋": 57575,
54
+ "橘": 57615,
55
+ "殊": 57591,
56
+ "毫": 57552,
57
+ "沟": 57596,
58
+ "泄": 57581,
59
+ "浅": 57623,
60
+ "济": 57570,
61
+ "涛": 57628,
62
+ "滚": 57539,
63
+ "滤": 57597,
64
+ "滨": 57545,
65
+ "灌": 57562,
66
+ "烦": 57532,
67
+ "烯": 57551,
68
+ "焕": 57557,
69
+ "皓": 57534,
70
+ "确": 57620,
71
+ "磊": 57547,
72
+ "绍": 57612,
73
+ "绕": 57600,
74
+ "综": 57613,
75
+ "缠": 57604,
76
+ "罚": 57563,
77
+ "翠": 57527,
78
+ "艳": 57550,
79
+ "芯": 57627,
80
+ "葛": 57569,
81
+ "蕾": 57574,
82
+ "螺": 57586,
83
+ "裕": 57624,
84
+ "裸": 57629,
85
+ "詹": 57529,
86
+ "训": 57589,
87
+ "询": 57599,
88
+ "诱": 57533,
89
+ "贤": 57606,
90
+ "赔": 57614,
91
+ "辆": 57535,
92
+ "辉": 57579,
93
+ "辐": 57588,
94
+ "辖": 57548,
95
+ "递": 57559,
96
+ "郑": 57626,
97
+ "郝": 57564,
98
+ "释": 57555,
99
+ "鑫": 57530,
100
+ "铭": 57544,
101
+ "链": 57611,
102
+ "际": 57540,
103
+ "陷": 57622,
104
+ "雇": 57582,
105
+ "颜": 57585,
106
+ "验": 57561,
107
+ "鸣": 57565,
108
+ "鼎": 57584,
109
+ "龚": 57576
110
+ }
config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "align_long_axis": true,
3
+ "architectures": [
4
+ "DonutModel"
5
+ ],
6
+ "decoder_layer": 4,
7
+ "encoder_layer": [
8
+ 2,
9
+ 2,
10
+ 14,
11
+ 2
12
+ ],
13
+ "input_size": [
14
+ 2560,
15
+ 1920
16
+ ],
17
+ "max_length": 1536,
18
+ "max_position_embeddings": 1536,
19
+ "model_type": "donut",
20
+ "torch_dtype": "float32",
21
+ "transformers_version": "4.11.3",
22
+ "window_size": 10
23
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21e8b5e708168f4f9885d18f8bc95ad6950439e7ac518161828ff0b27b984e8
3
+ size 1018458179
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb9e3dce4c326195d08fc3dd0f7e2eee1da8595c847bf4c1a9c78b7a82d47e2d
3
+ size 1296245
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true}, "additional_special_tokens": ["<s_iitcdip>", "<s_synthdog>"]}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "sp_model_kwargs": {}, "special_tokens_map_file": null, "tokenizer_file": "/root/.cache/huggingface/transformers/213c2041358e63047b407f94cde1ae23904d31a3bceb57eab291028c1e949437.7135a4b25ac726e19641f0d68803ff02bad960d6319064f55fa9c536929b86fc", "name_or_path": "hyunwoongko/asian-bart-ecjk", "tokenizer_class": "XLMRobertaTokenizer"}