Shushant committed on
Commit f4fe8bf
1 Parent(s): 959a426

Training in progress, step 500

config.json CHANGED
@@ -1,35 +1,28 @@
 {
-  "_name_or_path": "microsoft/deberta-v3-large",
+  "_name_or_path": "microsoft/BiomedNLP-PubMedBERT-large-uncased-abstract",
   "architectures": [
-    "DebertaV2ForQuestionAnswering"
+    "BertForQuestionAnswering"
   ],
   "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "eos_token_ids": 0,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "initializer_range": 0.02,
   "intermediate_size": 4096,
-  "layer_norm_eps": 1e-07,
+  "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
-  "max_relative_positions": -1,
-  "model_type": "deberta-v2",
-  "norm_rel_ebd": "layer_norm",
+  "model_type": "bert",
   "num_attention_heads": 16,
   "num_hidden_layers": 24,
+  "output_past": true,
   "pad_token_id": 0,
-  "pooler_dropout": 0,
-  "pooler_hidden_act": "gelu",
-  "pooler_hidden_size": 1024,
-  "pos_att_type": [
-    "p2c",
-    "c2p"
-  ],
-  "position_biased_input": false,
-  "position_buckets": 256,
-  "relative_attention": true,
-  "share_att_key": true,
+  "position_embedding_type": "absolute",
   "torch_dtype": "float32",
   "transformers_version": "4.26.0",
-  "type_vocab_size": 0,
-  "vocab_size": 128100
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
 }
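This commit swaps the base checkpoint from DeBERTa-v3-large to PubMedBERT-large: the architecture becomes a standard 24-layer BERT QA model, `layer_norm_eps` moves to BERT's 1e-12, the DeBERTa-specific relative-attention keys drop out, and the vocabulary shrinks from 128100 SentencePiece tokens to BERT's 30522 WordPiece tokens. A minimal sketch of loading such a checkpoint with `transformers`; the repo id below is a placeholder, since the diff does not name the repository:

```python
from transformers import AutoConfig, AutoModelForQuestionAnswering, AutoTokenizer

repo_id = "Shushant/biomedical-qa"  # placeholder repo id, not confirmed by this diff

config = AutoConfig.from_pretrained(repo_id)
assert config.model_type == "bert"    # was "deberta-v2" before this commit
assert config.vocab_size == 30522     # down from 128100

tokenizer = AutoTokenizer.from_pretrained(repo_id)               # resolves to a BERT tokenizer
model = AutoModelForQuestionAnswering.from_pretrained(repo_id)   # BertForQuestionAnswering
```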
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cea72aad0037c513cd906e1cf46f9e634a9f99a76a67581a9e8a7b16893e3110
-size 1736194351
+oid sha256:b248ce617ef5e6e35acaf865a71fb764a418f05b40bdbe66865bff05976c5490
+size 1336507185
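Only the Git LFS pointer changes here: the new oid and size describe a roughly 1.3 GB BERT-large checkpoint replacing the roughly 1.7 GB DeBERTa weights. A sketch for checking that a pulled file matches its pointer, assuming the file is available locally:

```python
import hashlib

def lfs_sha256(path: str, chunk_size: int = 1 << 20) -> str:
    """Hash a file the way a Git LFS pointer records it (plain sha256 of the contents)."""
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

# Compare against the oid in the pointer above (local path is an assumption).
print(lfs_sha256("pytorch_model.bin"))
```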
runs/Mar20_01-57-58_g002/1679273885.6293068/events.out.tfevents.1679273885.g002.189082.1 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:afba8cf8b0a042e379f8cfe4a2a1f32dda2b4d599de79131d83767a45f105cc3
+size 5680
runs/Mar20_01-57-58_g002/events.out.tfevents.1679273885.g002.189082.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb9717bc9a7556f366833995b1925b80eb52e75f805c888506a5daa85b01c499
+size 4050
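Both added `runs/` files are TensorBoard event logs for this training run, also stored as LFS pointers. Once pulled, they can be inspected with TensorBoard's event reader; a sketch, where the scalar tag name is only a guess:

```python
from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

ea = EventAccumulator("runs/Mar20_01-57-58_g002/events.out.tfevents.1679273885.g002.189082.0")
ea.Reload()
print(ea.Tags()["scalars"])          # list whatever scalar tags were logged
# for e in ea.Scalars("train/loss"):  # "train/loss" is an assumed tag name
#     print(e.step, e.value)
```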
special_tokens_map.json CHANGED
@@ -1,7 +1,5 @@
 {
-  "bos_token": "[CLS]",
   "cls_token": "[CLS]",
-  "eos_token": "[SEP]",
   "mask_token": "[MASK]",
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,17 +1,16 @@
 {
-  "bos_token": "[CLS]",
   "cls_token": "[CLS]",
-  "do_lower_case": false,
-  "eos_token": "[SEP]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
   "mask_token": "[MASK]",
   "model_max_length": 1000000000000000019884624838656,
-  "name_or_path": "microsoft/deberta-v3-large",
+  "name_or_path": "microsoft/BiomedNLP-PubMedBERT-large-uncased-abstract",
+  "never_split": null,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
-  "sp_model_kwargs": {},
   "special_tokens_map_file": null,
-  "split_by_punct": false,
-  "tokenizer_class": "DebertaV2Tokenizer",
-  "unk_token": "[UNK]",
-  "vocab_type": "spm"
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
 }
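The tokenizer moves from a SentencePiece `DebertaV2Tokenizer` to an uncased WordPiece `BertTokenizer` with `do_lower_case: true`, so raw text is now lowercased before tokenization; this is also why the `bos_token` and `eos_token` entries disappear from `special_tokens_map.json`. A quick sketch against the base model named in the config:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("microsoft/BiomedNLP-PubMedBERT-large-uncased-abstract")
print(type(tok).__name__)               # a BERT-style tokenizer class
print(tok.tokenize("BRCA1 Mutation"))   # lowercased WordPiece pieces, e.g. ['brca1', 'mutation']
```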
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f007bd5dd6b29c8b5637328b28dbbc23563841601a5be9e125a7c1862307c361
+oid sha256:b40f1673bab2022942080c2e359df4f8de328fe43ec253f4d45cae38e4d76254
 size 3503
vocab.txt ADDED
The diff for this file is too large to render. See raw diff