Joshua Lochner committed on
Commit
6f165a0
1 Parent(s): c31883a

Add `distilbert` and `mobilebert` models for zero-shot classification

Browse files
Files changed (24) hide show
  1. quantized/typeform/distilbert-base-uncased-mnli/default/config.json +34 -0
  2. quantized/typeform/distilbert-base-uncased-mnli/default/model.onnx +3 -0
  3. quantized/typeform/distilbert-base-uncased-mnli/default/special_tokens_map.json +7 -0
  4. quantized/typeform/distilbert-base-uncased-mnli/default/tokenizer.json +0 -0
  5. quantized/typeform/distilbert-base-uncased-mnli/default/tokenizer_config.json +15 -0
  6. quantized/typeform/distilbert-base-uncased-mnli/default/vocab.txt +0 -0
  7. quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/config.json +34 -0
  8. quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/model.onnx +3 -0
  9. quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/special_tokens_map.json +7 -0
  10. quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/tokenizer.json +0 -0
  11. quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/tokenizer_config.json +15 -0
  12. quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/vocab.txt +0 -0
  13. quantized/typeform/mobilebert-uncased-mnli/default/config.json +43 -0
  14. quantized/typeform/mobilebert-uncased-mnli/default/model.onnx +3 -0
  15. quantized/typeform/mobilebert-uncased-mnli/default/special_tokens_map.json +7 -0
  16. quantized/typeform/mobilebert-uncased-mnli/default/tokenizer.json +0 -0
  17. quantized/typeform/mobilebert-uncased-mnli/default/tokenizer_config.json +15 -0
  18. quantized/typeform/mobilebert-uncased-mnli/default/vocab.txt +0 -0
  19. quantized/typeform/mobilebert-uncased-mnli/sequence-classification/config.json +43 -0
  20. quantized/typeform/mobilebert-uncased-mnli/sequence-classification/model.onnx +3 -0
  21. quantized/typeform/mobilebert-uncased-mnli/sequence-classification/special_tokens_map.json +7 -0
  22. quantized/typeform/mobilebert-uncased-mnli/sequence-classification/tokenizer.json +0 -0
  23. quantized/typeform/mobilebert-uncased-mnli/sequence-classification/tokenizer_config.json +15 -0
  24. quantized/typeform/mobilebert-uncased-mnli/sequence-classification/vocab.txt +0 -0
quantized/typeform/distilbert-base-uncased-mnli/default/config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "typeform/distilbert-base-uncased-mnli",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "finetuning_task": "mnli",
11
+ "hidden_dim": 3072,
12
+ "id2label": {
13
+ "0": "ENTAILMENT",
14
+ "1": "NEUTRAL",
15
+ "2": "CONTRADICTION"
16
+ },
17
+ "initializer_range": 0.02,
18
+ "label2id": {
19
+ "CONTRADICTION": 2,
20
+ "ENTAILMENT": 0,
21
+ "NEUTRAL": 1
22
+ },
23
+ "max_position_embeddings": 512,
24
+ "model_type": "distilbert",
25
+ "n_heads": 12,
26
+ "n_layers": 6,
27
+ "pad_token_id": 0,
28
+ "qa_dropout": 0.1,
29
+ "seq_classif_dropout": 0.2,
30
+ "sinusoidal_pos_embds": false,
31
+ "tie_weights_": true,
32
+ "transformers_version": "4.27.3",
33
+ "vocab_size": 30522
34
+ }
quantized/typeform/distilbert-base-uncased-mnli/default/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4dd478572f0a8440857a24b84fb71126974ac4ee8b9be03718711011cead53b
3
+ size 66960030
quantized/typeform/distilbert-base-uncased-mnli/default/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
quantized/typeform/distilbert-base-uncased-mnli/default/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/distilbert-base-uncased-mnli/default/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 512,
7
+ "never_split": null,
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "special_tokens_map_file": null,
11
+ "strip_accents": null,
12
+ "tokenize_chinese_chars": true,
13
+ "tokenizer_class": "DistilBertTokenizer",
14
+ "unk_token": "[UNK]"
15
+ }
quantized/typeform/distilbert-base-uncased-mnli/default/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "typeform/distilbert-base-uncased-mnli",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "finetuning_task": "mnli",
11
+ "hidden_dim": 3072,
12
+ "id2label": {
13
+ "0": "ENTAILMENT",
14
+ "1": "NEUTRAL",
15
+ "2": "CONTRADICTION"
16
+ },
17
+ "initializer_range": 0.02,
18
+ "label2id": {
19
+ "CONTRADICTION": 2,
20
+ "ENTAILMENT": 0,
21
+ "NEUTRAL": 1
22
+ },
23
+ "max_position_embeddings": 512,
24
+ "model_type": "distilbert",
25
+ "n_heads": 12,
26
+ "n_layers": 6,
27
+ "pad_token_id": 0,
28
+ "qa_dropout": 0.1,
29
+ "seq_classif_dropout": 0.2,
30
+ "sinusoidal_pos_embds": false,
31
+ "tie_weights_": true,
32
+ "transformers_version": "4.27.3",
33
+ "vocab_size": 30522
34
+ }
quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f5b4dc1fe4ca3975d3ab5d915e8729c42c7c38fb7ce57802fdc62daf086ed95
3
+ size 67598558
quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 512,
7
+ "never_split": null,
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "special_tokens_map_file": null,
11
+ "strip_accents": null,
12
+ "tokenize_chinese_chars": true,
13
+ "tokenizer_class": "DistilBertTokenizer",
14
+ "unk_token": "[UNK]"
15
+ }
quantized/typeform/distilbert-base-uncased-mnli/sequence-classification/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/mobilebert-uncased-mnli/default/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "typeform/mobilebert-uncased-mnli",
3
+ "architectures": [
4
+ "MobileBertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_activation": false,
8
+ "classifier_dropout": null,
9
+ "embedding_size": 128,
10
+ "finetuning_task": "mnli",
11
+ "hidden_act": "relu",
12
+ "hidden_dropout_prob": 0.0,
13
+ "hidden_size": 512,
14
+ "id2label": {
15
+ "0": "ENTAILMENT",
16
+ "1": "NEUTRAL",
17
+ "2": "CONTRADICTION"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 512,
21
+ "intra_bottleneck_size": 128,
22
+ "key_query_shared_bottleneck": true,
23
+ "label2id": {
24
+ "CONTRADICTION": 2,
25
+ "ENTAILMENT": 0,
26
+ "NEUTRAL": 1
27
+ },
28
+ "layer_norm_eps": 1e-12,
29
+ "max_position_embeddings": 512,
30
+ "model_type": "mobilebert",
31
+ "normalization_type": "no_norm",
32
+ "num_attention_heads": 4,
33
+ "num_feedforward_networks": 4,
34
+ "num_hidden_layers": 24,
35
+ "pad_token_id": 0,
36
+ "transformers_version": "4.27.3",
37
+ "trigram_input": true,
38
+ "true_hidden_size": 128,
39
+ "type_vocab_size": 2,
40
+ "use_bottleneck": true,
41
+ "use_bottleneck_attention": false,
42
+ "vocab_size": 30522
43
+ }
quantized/typeform/mobilebert-uncased-mnli/default/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e8f2cec941c93e022d453ef291750f22bd70c3a0b7ebc842e4f37e98bf084c2
3
+ size 26920927
quantized/typeform/mobilebert-uncased-mnli/default/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
quantized/typeform/mobilebert-uncased-mnli/default/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/mobilebert-uncased-mnli/default/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 1000000000000000019884624838656,
7
+ "never_split": null,
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "special_tokens_map_file": null,
11
+ "strip_accents": null,
12
+ "tokenize_chinese_chars": true,
13
+ "tokenizer_class": "MobileBertTokenizer",
14
+ "unk_token": "[UNK]"
15
+ }
quantized/typeform/mobilebert-uncased-mnli/default/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/mobilebert-uncased-mnli/sequence-classification/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "typeform/mobilebert-uncased-mnli",
3
+ "architectures": [
4
+ "MobileBertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_activation": false,
8
+ "classifier_dropout": null,
9
+ "embedding_size": 128,
10
+ "finetuning_task": "mnli",
11
+ "hidden_act": "relu",
12
+ "hidden_dropout_prob": 0.0,
13
+ "hidden_size": 512,
14
+ "id2label": {
15
+ "0": "ENTAILMENT",
16
+ "1": "NEUTRAL",
17
+ "2": "CONTRADICTION"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 512,
21
+ "intra_bottleneck_size": 128,
22
+ "key_query_shared_bottleneck": true,
23
+ "label2id": {
24
+ "CONTRADICTION": 2,
25
+ "ENTAILMENT": 0,
26
+ "NEUTRAL": 1
27
+ },
28
+ "layer_norm_eps": 1e-12,
29
+ "max_position_embeddings": 512,
30
+ "model_type": "mobilebert",
31
+ "normalization_type": "no_norm",
32
+ "num_attention_heads": 4,
33
+ "num_feedforward_networks": 4,
34
+ "num_hidden_layers": 24,
35
+ "pad_token_id": 0,
36
+ "transformers_version": "4.27.3",
37
+ "trigram_input": true,
38
+ "true_hidden_size": 128,
39
+ "type_vocab_size": 2,
40
+ "use_bottleneck": true,
41
+ "use_bottleneck_attention": false,
42
+ "vocab_size": 30522
43
+ }
quantized/typeform/mobilebert-uncased-mnli/sequence-classification/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f75c35149501b9fb15a68358ca3a29d0f88b06e8dd7956ce5f34fca167d45cb7
3
+ size 27149640
quantized/typeform/mobilebert-uncased-mnli/sequence-classification/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
quantized/typeform/mobilebert-uncased-mnli/sequence-classification/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
quantized/typeform/mobilebert-uncased-mnli/sequence-classification/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 1000000000000000019884624838656,
7
+ "never_split": null,
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "special_tokens_map_file": null,
11
+ "strip_accents": null,
12
+ "tokenize_chinese_chars": true,
13
+ "tokenizer_class": "MobileBertTokenizer",
14
+ "unk_token": "[UNK]"
15
+ }
quantized/typeform/mobilebert-uncased-mnli/sequence-classification/vocab.txt ADDED
The diff for this file is too large to render. See raw diff