cliang1453 committed on
Commit
edb7d1a
1 Parent(s): 06bc862
Files changed (3)
  1. config.json +12 -7
  2. pytorch_model.bin +2 -2
  3. tokenizer.json +0 -0
config.json CHANGED
@@ -1,27 +1,31 @@
1
  {
2
- "_name_or_path": "microsoft/deberta-v3-base",
3
  "architectures": [
4
- "DebertaV2ForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
 
 
 
7
  "finetuning_task": "mrpc",
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
  "hidden_size": 768,
11
  "id2label": {
12
- "0": "not_equivalent",
13
- "1": "equivalent"
14
  },
15
  "initializer_range": 0.02,
16
  "intermediate_size": 3072,
17
  "label2id": {
18
- "equivalent": 1,
19
- "not_equivalent": 0
20
  },
21
  "layer_norm_eps": 1e-07,
22
  "max_position_embeddings": 512,
23
  "max_relative_positions": -1,
24
- "model_type": "deberta-v2",
25
  "norm_rel_ebd": "layer_norm",
26
  "num_attention_heads": 12,
27
  "num_hidden_layers": 12,
@@ -38,6 +42,7 @@
38
  "relative_attention": true,
39
  "share_att_key": true,
40
  "torch_dtype": "float32",
 
41
  "transformers_version": "4.28.0",
42
  "type_vocab_size": 0,
43
  "vocab_size": 128100
 
1
  {
2
+ "_name_or_path": "cliang1453/deberta-v3-base-mrpc",
3
  "architectures": [
4
+ "TEDDebertaV2ForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "filter_disabled": false,
8
+ "filter_interval": 1,
9
+ "filter_nonlinear": false,
10
+ "filter_output_dim": null,
11
  "finetuning_task": "mrpc",
12
  "hidden_act": "gelu",
13
  "hidden_dropout_prob": 0.1,
14
  "hidden_size": 768,
15
  "id2label": {
16
+ "0": 0,
17
+ "1": 1
18
  },
19
  "initializer_range": 0.02,
20
  "intermediate_size": 3072,
21
  "label2id": {
22
+ "0": 0,
23
+ "1": 1
24
  },
25
  "layer_norm_eps": 1e-07,
26
  "max_position_embeddings": 512,
27
  "max_relative_positions": -1,
28
+ "model_type": "ted-deberta-v2",
29
  "norm_rel_ebd": "layer_norm",
30
  "num_attention_heads": 12,
31
  "num_hidden_layers": 12,
 
42
  "relative_attention": true,
43
  "share_att_key": true,
44
  "torch_dtype": "float32",
45
+ "train_filters": true,
46
  "transformers_version": "4.28.0",
47
  "type_vocab_size": 0,
48
  "vocab_size": 128100
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01a49d899f91761c4706f1f5603c3b1b4a434d0dbbc87d746e5b8208ab461484
3
- size 737768761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee03c504b8050e8f888fc8253682502e5f151df63aaf0e36aa66d49f72e6226e
3
+ size 794562713
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff