Whalejay committed on
Commit
12554df
1 Parent(s): 1c39e54

Upload BertForQuestionAnswering

Browse files
Files changed (3) hide show
  1. README.md +10 -11
  2. config.json +16 -16
  3. model.safetensors +2 -2
README.md CHANGED
@@ -9,25 +9,24 @@ license: mit
9
  datasets:
10
  - squad
11
  pipeline_tag: question-answering
12
-
13
  model-index:
14
  - name: bert-sliding-window_epoch_1
15
  results:
16
- - task:
17
  type: question-answering
18
  name: Question Answering
19
- metrics:
20
- - type: exact_match
21
- value: N/A # You can update this with actual metrics if available
22
- name: Exact Match
23
- - type: f1
24
- value: N/A # You can update this with actual metrics if available
25
- name: F1
26
  dataset:
27
  name: SQuAD
28
  type: squad
29
- config: plain_text # Adding the config field
30
- split: validation # Adding the split field
 
 
 
 
 
 
 
31
  ---
32
 
33
  # bert-sliding-window_epoch_1
 
9
  datasets:
10
  - squad
11
  pipeline_tag: question-answering
 
12
  model-index:
13
  - name: bert-sliding-window_epoch_1
14
  results:
15
+ - task:
16
  type: question-answering
17
  name: Question Answering
 
 
 
 
 
 
 
18
  dataset:
19
  name: SQuAD
20
  type: squad
21
+ config: plain_text
22
+ split: validation
23
+ metrics:
24
+ - type: exact_match
25
+ value: N/A
26
+ name: Exact Match
27
+ - type: f1
28
+ value: N/A
29
+ name: F1
30
  ---
31
 
32
  # bert-sliding-window_epoch_1
config.json CHANGED
@@ -1,25 +1,25 @@
1
  {
2
- "_name_or_path": "Whalejay/bert-sliding-window_epoch_3",
3
- "activation": "gelu",
4
  "architectures": [
5
- "DistilBertForQuestionAnswering"
6
  ],
7
- "attention_dropout": 0.1,
8
- "dim": 768,
9
- "dropout": 0.1,
10
- "hidden_dim": 3072,
 
11
  "initializer_range": 0.02,
 
 
12
  "max_position_embeddings": 512,
13
- "model_type": "distilbert",
14
- "n_heads": 12,
15
- "n_layers": 6,
16
- "output_past": true,
17
  "pad_token_id": 0,
18
- "qa_dropout": 0.1,
19
- "seq_classif_dropout": 0.2,
20
- "sinusoidal_pos_embds": true,
21
- "tie_weights_": true,
22
  "torch_dtype": "float32",
23
  "transformers_version": "4.46.0",
24
- "vocab_size": 28996
 
 
25
  }
 
1
  {
2
+ "_name_or_path": "bert-large-uncased-whole-word-masking-finetuned-squad",
 
3
  "architectures": [
4
+ "BertForQuestionAnswering"
5
  ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 1024,
11
  "initializer_range": 0.02,
12
+ "intermediate_size": 4096,
13
+ "layer_norm_eps": 1e-12,
14
  "max_position_embeddings": 512,
15
+ "model_type": "bert",
16
+ "num_attention_heads": 16,
17
+ "num_hidden_layers": 24,
 
18
  "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
 
 
 
20
  "torch_dtype": "float32",
21
  "transformers_version": "4.46.0",
22
+ "type_vocab_size": 2,
23
+ "use_cache": true,
24
+ "vocab_size": 30522
25
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22a26473edb71e4f992af3c63cd9a7937e00fcaba80c186f00431bb7d2ffdb9b
3
- size 260782152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48c71317e65868aa101024f9c4c2cec0ae5e054acee63757e63e0ce73393b00d
3
+ size 1336424168