Xenova HF staff committed on
Commit
12ad3f9
1 Parent(s): 5b67340

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "sshleifer/distilbart-cnn-12-3",
3
+ "_num_labels": 3,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "gelu",
6
+ "add_bias_logits": false,
7
+ "add_final_layer_norm": false,
8
+ "architectures": [
9
+ "BartForConditionalGeneration"
10
+ ],
11
+ "attention_dropout": 0.0,
12
+ "bos_token_id": 0,
13
+ "classif_dropout": 0.0,
14
+ "classifier_dropout": 0.0,
15
+ "d_model": 1024,
16
+ "decoder_attention_heads": 16,
17
+ "decoder_ffn_dim": 4096,
18
+ "decoder_layerdrop": 0.0,
19
+ "decoder_layers": 3,
20
+ "decoder_start_token_id": 2,
21
+ "dropout": 0.1,
22
+ "early_stopping": true,
23
+ "encoder_attention_heads": 16,
24
+ "encoder_ffn_dim": 4096,
25
+ "encoder_layerdrop": 0.0,
26
+ "encoder_layers": 12,
27
+ "eos_token_id": 2,
28
+ "extra_pos_embeddings": 2,
29
+ "force_bos_token_to_be_generated": true,
30
+ "forced_bos_token_id": 0,
31
+ "forced_eos_token_id": 2,
32
+ "gradient_checkpointing": false,
33
+ "id2label": {
34
+ "0": "LABEL_0",
35
+ "1": "LABEL_1",
36
+ "2": "LABEL_2"
37
+ },
38
+ "init_std": 0.02,
39
+ "is_encoder_decoder": true,
40
+ "label2id": {
41
+ "LABEL_0": 0,
42
+ "LABEL_1": 1,
43
+ "LABEL_2": 2
44
+ },
45
+ "length_penalty": 2.0,
46
+ "max_length": 142,
47
+ "max_position_embeddings": 1024,
48
+ "min_length": 56,
49
+ "model_type": "bart",
50
+ "no_repeat_ngram_size": 3,
51
+ "normalize_before": false,
52
+ "normalize_embedding": true,
53
+ "num_beams": 4,
54
+ "num_hidden_layers": 12,
55
+ "output_past": true,
56
+ "pad_token_id": 1,
57
+ "prefix": " ",
58
+ "save_step": 14,
59
+ "scale_embedding": false,
60
+ "static_position_embeddings": false,
61
+ "task_specific_params": {
62
+ "summarization": {
63
+ "early_stopping": true,
64
+ "length_penalty": 2.0,
65
+ "max_length": 142,
66
+ "min_length": 56,
67
+ "no_repeat_ngram_size": 3,
68
+ "num_beams": 4
69
+ }
70
+ },
71
+ "transformers_version": "4.34.0.dev0",
72
+ "use_cache": true,
73
+ "vocab_size": 50264
74
+ }
generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "decoder_start_token_id": 2,
5
+ "early_stopping": true,
6
+ "eos_token_id": 2,
7
+ "forced_bos_token_id": 0,
8
+ "forced_eos_token_id": 2,
9
+ "length_penalty": 2.0,
10
+ "max_length": 142,
11
+ "min_length": 56,
12
+ "no_repeat_ngram_size": 3,
13
+ "num_beams": 4,
14
+ "pad_token_id": 1,
15
+ "transformers_version": "4.34.0.dev0"
16
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10379ca97f436cdf9aa6c67aa65c10c47c458347e73fdba181a5377117059176
3
+ size 412005107
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e5a9018ec849577de51f544dad70a0476d06a3d011571817ed39c31b6094d03
3
+ size 412134082
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdc72a62e632643c6f187d03214f3f6f577bfc543070a57c2d2cee87628c599b
3
+ size 103937351
onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08bbac385e49d1abe308592c320fde3e8b656c6da2812dce72a690f9f973994d
3
+ size 103735466
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e2679d1b876997e1e96a3fea7b5b91116a067ae0bd60c4fda525bc2725eee4c
3
+ size 386790644
onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c06e4f5f0fd6aa2addc90e211fd3972c47ce56b338457aac9239373095ee8ebe
3
+ size 97349834
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7b0f1c0a7de98749bbafc2360fba831736a20af875a208307a28745f2dc51ed
3
+ size 814942257
onnx/encoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:859513ea514dc9b43d975efca26f5b40b4c529eb874ab9e4df9165b50dc6f3d1
3
+ size 205100092
quantize_config.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "decoder_model": {
6
+ "op_types": [
7
+ "Unsqueeze",
8
+ "Where",
9
+ "Sub",
10
+ "Cast",
11
+ "Less",
12
+ "Softmax",
13
+ "Sqrt",
14
+ "ReduceMean",
15
+ "ConstantOfShape",
16
+ "Add",
17
+ "Transpose",
18
+ "Gather",
19
+ "Mul",
20
+ "Expand",
21
+ "Pow",
22
+ "Erf",
23
+ "Range",
24
+ "Squeeze",
25
+ "Div",
26
+ "Constant",
27
+ "Reshape",
28
+ "Shape",
29
+ "Equal",
30
+ "Slice",
31
+ "MatMul",
32
+ "Concat"
33
+ ],
34
+ "weight_type": "QInt8"
35
+ },
36
+ "encoder_model": {
37
+ "op_types": [
38
+ "Unsqueeze",
39
+ "Where",
40
+ "Sub",
41
+ "Cast",
42
+ "Softmax",
43
+ "Sqrt",
44
+ "ReduceMean",
45
+ "ConstantOfShape",
46
+ "Add",
47
+ "Transpose",
48
+ "Gather",
49
+ "Mul",
50
+ "Expand",
51
+ "Pow",
52
+ "Erf",
53
+ "Range",
54
+ "Div",
55
+ "Constant",
56
+ "Reshape",
57
+ "Shape",
58
+ "Equal",
59
+ "MatMul",
60
+ "Concat"
61
+ ],
62
+ "weight_type": "QInt8"
63
+ },
64
+ "decoder_model_merged": {
65
+ "op_types": [
66
+ "Unsqueeze",
67
+ "Where",
68
+ "Sub",
69
+ "Cast",
70
+ "Less",
71
+ "Softmax",
72
+ "Sqrt",
73
+ "ReduceMean",
74
+ "ConstantOfShape",
75
+ "Add",
76
+ "Transpose",
77
+ "Gather",
78
+ "Mul",
79
+ "Expand",
80
+ "Pow",
81
+ "Erf",
82
+ "Range",
83
+ "Squeeze",
84
+ "Div",
85
+ "Constant",
86
+ "Reshape",
87
+ "Shape",
88
+ "Equal",
89
+ "Slice",
90
+ "MatMul",
91
+ "Concat",
92
+ "If"
93
+ ],
94
+ "weight_type": "QInt8"
95
+ },
96
+ "decoder_with_past_model": {
97
+ "op_types": [
98
+ "Unsqueeze",
99
+ "Where",
100
+ "Sub",
101
+ "Cast",
102
+ "Softmax",
103
+ "Sqrt",
104
+ "ReduceMean",
105
+ "ConstantOfShape",
106
+ "Add",
107
+ "Transpose",
108
+ "Gather",
109
+ "Mul",
110
+ "Expand",
111
+ "Pow",
112
+ "Erf",
113
+ "Range",
114
+ "Div",
115
+ "Constant",
116
+ "Reshape",
117
+ "Shape",
118
+ "Equal",
119
+ "MatMul",
120
+ "Concat"
121
+ ],
122
+ "weight_type": "QInt8"
123
+ }
124
+ }
125
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": {
4
+ "__type": "AddedToken",
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "clean_up_tokenization_spaces": true,
12
+ "cls_token": {
13
+ "__type": "AddedToken",
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": true,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ },
20
+ "eos_token": {
21
+ "__type": "AddedToken",
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": true,
25
+ "rstrip": false,
26
+ "single_word": false
27
+ },
28
+ "errors": "replace",
29
+ "mask_token": {
30
+ "__type": "AddedToken",
31
+ "content": "<mask>",
32
+ "lstrip": true,
33
+ "normalized": true,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "model_max_length": 1024,
38
+ "pad_token": {
39
+ "__type": "AddedToken",
40
+ "content": "<pad>",
41
+ "lstrip": false,
42
+ "normalized": true,
43
+ "rstrip": false,
44
+ "single_word": false
45
+ },
46
+ "sep_token": {
47
+ "__type": "AddedToken",
48
+ "content": "</s>",
49
+ "lstrip": false,
50
+ "normalized": true,
51
+ "rstrip": false,
52
+ "single_word": false
53
+ },
54
+ "tokenizer_class": "BartTokenizer",
55
+ "trim_offsets": true,
56
+ "unk_token": {
57
+ "__type": "AddedToken",
58
+ "content": "<unk>",
59
+ "lstrip": false,
60
+ "normalized": true,
61
+ "rstrip": false,
62
+ "single_word": false
63
+ }
64
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff