versae committed on
Commit
8b75ee9
1 Parent(s): 984f903

Training in progress, epoch 1

Browse files
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1 @@
 
1
+ {"[MASK]": 250101}
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/mdeberta-v3-base",
3
+ "architectures": [
4
+ "DebertaV2ForMultipleChoice"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 768,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 3072,
12
+ "layer_norm_eps": 1e-07,
13
+ "max_position_embeddings": 512,
14
+ "max_relative_positions": -1,
15
+ "model_type": "deberta-v2",
16
+ "norm_rel_ebd": "layer_norm",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "pooler_dropout": 0,
21
+ "pooler_hidden_act": "gelu",
22
+ "pooler_hidden_size": 768,
23
+ "pos_att_type": [
24
+ "p2c",
25
+ "c2p"
26
+ ],
27
+ "position_biased_input": false,
28
+ "position_buckets": 256,
29
+ "relative_attention": true,
30
+ "share_att_key": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.19.0",
33
+ "type_vocab_size": 0,
34
+ "vocab_size": 251000
35
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9770b2b835701927491355e10dbbb9887dc30ac0b8f181de98f16af181e4ae7c
3
+ size 1115312683
runs/May22_18-29-21_ficino/1653236975.7186632/events.out.tfevents.1653236975.ficino.102708.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:909d65b57988a901f31325a2c13e3b8a23135e185ba933c74ff80907e6d4c6d3
3
+ size 5224
runs/May22_18-29-21_ficino/1653236982.6658745/events.out.tfevents.1653236982.ficino.102708.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37a9f423560d5002d45f7d42149fbad4572caac2a2375eeb8c55cd66eb45884b
3
+ size 5224
runs/May22_18-29-21_ficino/1653236983.8893442/events.out.tfevents.1653236983.ficino.102708.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:879d7b8c69c626ba7202b0462c878f76acb4087b9dd3298ee46a98046faab268
3
+ size 5224
runs/May22_18-29-21_ficino/1653236986.2733886/events.out.tfevents.1653236986.ficino.102708.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f6865dd95b8672900bde818447780278785e0cb64e279d228911cd2ac9077e9
3
+ size 5224
runs/May22_18-29-21_ficino/1653236986.971763/events.out.tfevents.1653236986.ficino.102708.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a4b8921418a12062cfb7caa96b9adadbb81c6ad515ef1d794c6d5f22553a72f
3
+ size 5224
runs/May22_18-29-21_ficino/events.out.tfevents.1653236975.ficino.102708.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:598921e828c0108307722083b2eeefc3b4b992a17af65fa4e4d10b138417c0c2
3
+ size 18410
runs/May22_18-31-38_ficino/1653237110.7614782/events.out.tfevents.1653237110.ficino.105698.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a9684136bc7eea438bc025840029e207b4f173d9edff281a52bf0705718d85
3
+ size 5224
runs/May22_18-31-38_ficino/1653237127.270303/events.out.tfevents.1653237127.ficino.105698.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b76407bce14d23072c06dbf10d513b810999562c280ce8dc077b39844adc150
3
+ size 5224
runs/May22_18-31-38_ficino/events.out.tfevents.1653237110.ficino.105698.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6f791d764e6e71455440c144bd1d1e8a8365a3cf935084d389f0c9a1016a779
3
+ size 7388
runs/May22_18-35-39_ficino/1653237351.2236302/events.out.tfevents.1653237351.ficino.110672.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ebf4a9b3f51b0aa759765cd263aef65cea74fbf0f8c048517143d225b6b364d
3
+ size 5224
runs/May22_18-35-39_ficino/events.out.tfevents.1653237351.ficino.110672.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be999d37e86b46af20cace0aa751c94bdcb7bf799b41e4ce9f10da25e8406e89
3
+ size 4351
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13c8d666d62a7bc4ac8f040aab68e942c861f93303156cc28f5c7e885d86d6e3
3
+ size 4305025
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f06fc3bbcbbc8f07be861b9a6a69e177247bc549b2bcbf0483e4dd98c06b6f6
3
+ size 16331301
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"do_lower_case": false, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "split_by_punct": false, "vocab_type": "spm", "special_tokens_map_file": null, "name_or_path": "microsoft/mdeberta-v3-base", "sp_model_kwargs": {}, "tokenizer_class": "DebertaV2Tokenizer"}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d60598dfafe22c79edaed86a5e4ddd18cc492a05b0744afc3caa3119e1f739d
3
+ size 3247