theojolliffe committed on
Commit
5c00170
1 Parent(s): 988c2b5

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,8 +1,9 @@
1
  {
2
- "_name_or_path": "facebook/bart-large-cnn",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
 
6
  "add_final_layer_norm": false,
7
  "architectures": [
8
  "BartForConditionalGeneration"
@@ -15,7 +16,7 @@
15
  "decoder_attention_heads": 16,
16
  "decoder_ffn_dim": 4096,
17
  "decoder_layerdrop": 0.0,
18
- "decoder_layers": 12,
19
  "decoder_start_token_id": 2,
20
  "dropout": 0.1,
21
  "early_stopping": true,
@@ -24,8 +25,10 @@
24
  "encoder_layerdrop": 0.0,
25
  "encoder_layers": 12,
26
  "eos_token_id": 2,
27
- "force_bos_token_to_be_generated": true,
28
- "forced_bos_token_id": 0,
 
 
29
  "forced_eos_token_id": 2,
30
  "gradient_checkpointing": false,
31
  "id2label": {
@@ -40,29 +43,26 @@
40
  "LABEL_1": 1,
41
  "LABEL_2": 2
42
  },
43
- "length_penalty": 2.0,
44
- "max_length": 142,
45
  "max_position_embeddings": 1024,
46
- "min_length": 56,
47
  "model_type": "bart",
48
  "no_repeat_ngram_size": 3,
49
  "normalize_before": false,
50
- "num_beams": 4,
 
51
  "num_hidden_layers": 12,
52
  "output_past": true,
53
  "pad_token_id": 1,
54
  "prefix": " ",
 
 
55
  "scale_embedding": false,
56
- "task_specific_params": {
57
- "summarization": {
58
- "early_stopping": true,
59
- "length_penalty": 2.0,
60
- "max_length": 142,
61
- "min_length": 56,
62
- "no_repeat_ngram_size": 3,
63
- "num_beams": 4
64
- }
65
- },
66
  "torch_dtype": "float32",
67
  "transformers_version": "4.28.1",
68
  "use_cache": true,
 
1
  {
2
+ "_name_or_path": "sshleifer/distilbart-xsum-12-6",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
6
+ "add_bias_logits": false,
7
  "add_final_layer_norm": false,
8
  "architectures": [
9
  "BartForConditionalGeneration"
 
16
  "decoder_attention_heads": 16,
17
  "decoder_ffn_dim": 4096,
18
  "decoder_layerdrop": 0.0,
19
+ "decoder_layers": 6,
20
  "decoder_start_token_id": 2,
21
  "dropout": 0.1,
22
  "early_stopping": true,
 
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 12,
27
  "eos_token_id": 2,
28
+ "eos_token_ids": [
29
+ 2
30
+ ],
31
+ "extra_pos_embeddings": 2,
32
  "forced_eos_token_id": 2,
33
  "gradient_checkpointing": false,
34
  "id2label": {
 
43
  "LABEL_1": 1,
44
  "LABEL_2": 2
45
  },
46
+ "length_penalty": 0.5,
47
+ "max_length": 62,
48
  "max_position_embeddings": 1024,
49
+ "min_length": 11,
50
  "model_type": "bart",
51
  "no_repeat_ngram_size": 3,
52
  "normalize_before": false,
53
+ "normalize_embedding": true,
54
+ "num_beams": 6,
55
  "num_hidden_layers": 12,
56
  "output_past": true,
57
  "pad_token_id": 1,
58
  "prefix": " ",
59
+ "replacing_rate": 0,
60
+ "save_step": 58,
61
  "scale_embedding": false,
62
+ "static_position_embeddings": false,
63
+ "student_decoder_layers": null,
64
+ "student_encoder_layers": null,
65
+ "task_specific_params": {},
 
 
 
 
 
 
66
  "torch_dtype": "float32",
67
  "transformers_version": "4.28.1",
68
  "use_cache": true,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8577d66fd770bd0b6e6221be6393cd9e5830cfe5849488cbe10d6d30fceeb01c
3
- size 1625537293
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61af7dbaf40b66e1411ba12d137a1ad9555c082f683bae587b6c52ed676df22e
3
+ size 1222363741
runs/Apr22_12-18-45_0943f7874f3f/1682166323.1325157/events.out.tfevents.1682166323.0943f7874f3f.184.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ab88e794da596ec4676dbe35ecd045e4caf3093e5c48d8ddd45a0f5dc4b35c
3
+ size 6182
runs/Apr22_12-18-45_0943f7874f3f/events.out.tfevents.1682166323.0943f7874f3f.184.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6db05d422981e156f9747705258dc1a0ff9d0a24f0aed196cc78a2a8ddf31b7
3
+ size 5317
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d090541b797207cd5d97fec2e8071952f7386cea72f7a776de1b78eaa21b1ec3
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f4f505825ebe3eeadd2e439b069a4bda24a9a30bb879b8ea16bffc792aae427
3
  size 3771