domenicrosati committed on
Commit
17578f0
1 Parent(s): df58c50

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,25 +1,25 @@
1
  {
2
- "_name_or_path": "microsoft/deberta-v3-small",
3
  "architectures": [
4
  "DebertaV2ForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
- "hidden_size": 768,
10
  "initializer_range": 0.02,
11
- "intermediate_size": 3072,
12
  "layer_norm_eps": 1e-07,
13
  "max_position_embeddings": 512,
14
  "max_relative_positions": -1,
15
  "model_type": "deberta-v2",
16
  "norm_rel_ebd": "layer_norm",
17
- "num_attention_heads": 12,
18
- "num_hidden_layers": 6,
19
  "pad_token_id": 0,
20
  "pooler_dropout": 0,
21
  "pooler_hidden_act": "gelu",
22
- "pooler_hidden_size": 768,
23
  "pos_att_type": [
24
  "p2c",
25
  "c2p"
 
1
  {
2
+ "_name_or_path": "microsoft/deberta-v3-xsmall",
3
  "architectures": [
4
  "DebertaV2ForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 384,
10
  "initializer_range": 0.02,
11
+ "intermediate_size": 1536,
12
  "layer_norm_eps": 1e-07,
13
  "max_position_embeddings": 512,
14
  "max_relative_positions": -1,
15
  "model_type": "deberta-v2",
16
  "norm_rel_ebd": "layer_norm",
17
+ "num_attention_heads": 6,
18
+ "num_hidden_layers": 12,
19
  "pad_token_id": 0,
20
  "pooler_dropout": 0,
21
  "pooler_hidden_act": "gelu",
22
+ "pooler_hidden_size": 384,
23
  "pos_att_type": [
24
  "p2c",
25
  "c2p"
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d0491101a52e09f2df1773d89d8e5c386abf554b4af21a818a2ec3d57139549
3
- size 567625195
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fe2ef5cf2eb6b29a846dbecbf490ccf990329ed213c38424ec170965cad36df
3
+ size 283395115
runs/Jan31_21-48-38_020be3d3978e/1675201739.9608088/events.out.tfevents.1675201739.020be3d3978e.43590.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b451dd592f2528fcd8c1e81f79b42921c1dbbcfcc624f0ba721f7dba7e45ea8
3
+ size 5348
runs/Jan31_21-48-38_020be3d3978e/events.out.tfevents.1675201732.020be3d3978e.43590.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbf7dde330e778ecba0072df85f7001386ecc117bec5f24033518c11bba18fd9
3
+ size 341
runs/Jan31_21-50-22_020be3d3978e/1675201844.0813227/events.out.tfevents.1675201844.020be3d3978e.44173.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f7a4574a97847dfa50540217b36f357e91c24de9904d5bb5ff895db1c1125be
3
+ size 5348
runs/Jan31_21-50-22_020be3d3978e/events.out.tfevents.1675201836.020be3d3978e.44173.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac60f36d64dd644d73d593da183b762e871416c677c64f98e31edf12d2eeac9
3
+ size 4072
runs/Jan31_22-03-26_020be3d3978e/1675202622.96545/events.out.tfevents.1675202622.020be3d3978e.44693.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ca3b2e1eeb72ebfc569cabbbce04f303771710cdd9bb194fbc1c65ba033549
3
+ size 5348
runs/Jan31_22-03-26_020be3d3978e/events.out.tfevents.1675202615.020be3d3978e.44693.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a68ddf24f6730f23c53631c59cba69e12dcec1b5890b466d95bb4ebec67d785a
3
+ size 4442
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 256,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
tokenizer_config.json CHANGED
@@ -4,7 +4,7 @@
4
  "do_lower_case": false,
5
  "eos_token": "[SEP]",
6
  "mask_token": "[MASK]",
7
- "name_or_path": "microsoft/deberta-v3-small",
8
  "pad_token": "[PAD]",
9
  "sep_token": "[SEP]",
10
  "sp_model_kwargs": {},
 
4
  "do_lower_case": false,
5
  "eos_token": "[SEP]",
6
  "mask_token": "[MASK]",
7
+ "name_or_path": "microsoft/deberta-v3-xsmall",
8
  "pad_token": "[PAD]",
9
  "sep_token": "[SEP]",
10
  "sp_model_kwargs": {},
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9172f3e6f008f793f3dda546fa67314678c015c39fac4b86674b30f66175ddb0
3
  size 3375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dae3860dcd6a23f6a49f71505a6f79cc3c8736d743e499a15d95ec5a3624903f
3
  size 3375