midav committed on
Commit
e066cac
1 Parent(s): d625543

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +50 -3
config.json CHANGED
@@ -1,8 +1,43 @@
1
  {
2
  "_name_or_path": "roberta-base",
3
  "adapters": {
4
- "adapters": {},
5
- "config_map": {},
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  "fusion_config_map": {},
7
  "fusions": {}
8
  },
@@ -25,7 +60,19 @@
25
  "num_hidden_layers": 12,
26
  "pad_token_id": 1,
27
  "position_embedding_type": "absolute",
28
- "prediction_heads": {},
 
 
 
 
 
 
 
 
 
 
 
 
29
  "torch_dtype": "float32",
30
  "transformers_version": "4.21.3",
31
  "type_vocab_size": 1,
1
  {
2
  "_name_or_path": "roberta-base",
3
  "adapters": {
4
+ "adapters": {
5
+ "quartz": "9076f36a74755ac4"
6
+ },
7
+ "config_map": {
8
+ "9076f36a74755ac4": {
9
+ "adapter_residual_before_ln": false,
10
+ "cross_adapter": false,
11
+ "factorized_phm_W": true,
12
+ "factorized_phm_rule": false,
13
+ "hypercomplex_nonlinearity": "glorot-uniform",
14
+ "init_weights": "bert",
15
+ "inv_adapter": null,
16
+ "inv_adapter_reduction_factor": null,
17
+ "is_parallel": false,
18
+ "learn_phm": true,
19
+ "leave_out": [],
20
+ "ln_after": false,
21
+ "ln_before": false,
22
+ "mh_adapter": false,
23
+ "non_linearity": "relu",
24
+ "original_ln_after": true,
25
+ "original_ln_before": true,
26
+ "output_adapter": true,
27
+ "phm_bias": true,
28
+ "phm_c_init": "normal",
29
+ "phm_dim": 4,
30
+ "phm_init_range": 0.0001,
31
+ "phm_layer": false,
32
+ "phm_rank": 1,
33
+ "reduction_factor": 16,
34
+ "residual_before_ln": true,
35
+ "scaling": 1.0,
36
+ "shared_W_phm": false,
37
+ "shared_phm_rule": true,
38
+ "use_gating": false
39
+ }
40
+ },
41
  "fusion_config_map": {},
42
  "fusions": {}
43
  },
60
  "num_hidden_layers": 12,
61
  "pad_token_id": 1,
62
  "position_embedding_type": "absolute",
63
+ "prediction_heads": {
64
+ "quartz": {
65
+ "activation_function": "tanh",
66
+ "head_type": "multiple_choice",
67
+ "label2id": {
68
+ "A": 0,
69
+ "B": 1
70
+ },
71
+ "layers": 2,
72
+ "num_choices": 2,
73
+ "use_pooler": false
74
+ }
75
+ },
76
  "torch_dtype": "float32",
77
  "transformers_version": "4.21.3",
78
  "type_vocab_size": 1,