devpranjal committed on
Commit
2e0329c
1 Parent(s): 5f45e86

Upload DebertaV2ForQuestionAnswering

Browse files
Files changed (2) hide show
  1. config.json +7 -1
  2. pytorch_model.bin +1 -1
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "deberta-v3-base-devrev-data",
3
  "architectures": [
4
  "DebertaV2ForQuestionAnswering"
5
  ],
@@ -9,10 +9,12 @@
9
  "hidden_size": 768,
10
  "initializer_range": 0.02,
11
  "intermediate_size": 3072,
 
12
  "layer_norm_eps": 1e-07,
13
  "max_position_embeddings": 512,
14
  "max_relative_positions": -1,
15
  "model_type": "deberta-v2",
 
16
  "norm_rel_ebd": "layer_norm",
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
@@ -28,6 +30,10 @@
28
  "position_buckets": 256,
29
  "relative_attention": true,
30
  "share_att_key": true,
 
 
 
 
31
  "torch_dtype": "float32",
32
  "transformers_version": "4.26.0",
33
  "type_vocab_size": 0,
 
1
  {
2
+ "_name_or_path": "deepset/deberta-v3-base-squad2",
3
  "architectures": [
4
  "DebertaV2ForQuestionAnswering"
5
  ],
 
9
  "hidden_size": 768,
10
  "initializer_range": 0.02,
11
  "intermediate_size": 3072,
12
+ "language": "english",
13
  "layer_norm_eps": 1e-07,
14
  "max_position_embeddings": 512,
15
  "max_relative_positions": -1,
16
  "model_type": "deberta-v2",
17
+ "name": "DebertaV2",
18
  "norm_rel_ebd": "layer_norm",
19
  "num_attention_heads": 12,
20
  "num_hidden_layers": 12,
 
30
  "position_buckets": 256,
31
  "relative_attention": true,
32
  "share_att_key": true,
33
+ "summary_activation": "tanh",
34
+ "summary_last_dropout": 0,
35
+ "summary_type": "first",
36
+ "summary_use_proj": false,
37
  "torch_dtype": "float32",
38
  "transformers_version": "4.26.0",
39
  "type_vocab_size": 0,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e01cc0b34732b377b2e604f8eb2170e52041f4e9c7ed11bf859982eb5161077b
3
  size 735402993
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:184e22f9d6d6f6b82d2ac0907850ae3347f3c92ecdedfc12cedbb82c425abbd0
3
  size 735402993