GlycerinLOL committed on
Commit
d9994e7
1 Parent(s): 0b24e67

Training in progress, step 500

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ generated_predictions.json filter=lfs diff=lfs merge=lfs -text
all_results.json CHANGED
@@ -1,12 +1,15 @@
1
  {
2
- "predict_gen_len": 28.834,
3
- "predict_loss": 1.8422898054122925,
4
- "predict_rouge1": 0.4278,
5
- "predict_rouge2": 0.1789,
6
- "predict_rougeL": 0.3407,
7
- "predict_rougeLsum": 0.3407,
8
- "predict_runtime": 2061.934,
 
 
 
9
  "predict_samples": 11334,
10
- "predict_samples_per_second": 5.497,
11
- "predict_steps_per_second": 0.172
12
  }
 
1
  {
2
+ "predict_f1": 0.906,
3
+ "predict_gen_len": 30.77916004940886,
4
+ "predict_loss": 1.6894419193267822,
5
+ "predict_precision": 0.9008,
6
+ "predict_recall": 0.9115,
7
+ "predict_rouge1": 0.4408,
8
+ "predict_rouge2": 0.1888,
9
+ "predict_rougeL": 0.3528,
10
+ "predict_rougeLsum": 0.3528,
11
+ "predict_runtime": 3437.6578,
12
  "predict_samples": 11334,
13
+ "predict_samples_per_second": 3.297,
14
+ "predict_steps_per_second": 0.412
15
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "Models/LLM_Teached_Pegasus_Large",
3
  "activation_dropout": 0.1,
4
  "activation_function": "relu",
5
  "add_bias_logits": false,
 
1
  {
2
+ "_name_or_path": "google/pegasus-large",
3
  "activation_dropout": 0.1,
4
  "activation_function": "relu",
5
  "add_bias_logits": false,
generated_predictions.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecfb91cde9f4511dac83b80773fe9ee62662db70716fef5053335fca4b6b7417
3
+ size 27483141
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab52b4b7f1b050bd880fa12529d3c148fdd68fce219a518cfcb8e630a158c091
3
  size 2283652852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dcd871daccefb604319e20da7a0b9417139e5708de62c77da9decf2ca46f79f
3
  size 2283652852
predict_results.json CHANGED
@@ -1,12 +1,15 @@
1
  {
2
- "predict_gen_len": 28.834,
3
- "predict_loss": 1.8422898054122925,
4
- "predict_rouge1": 0.4278,
5
- "predict_rouge2": 0.1789,
6
- "predict_rougeL": 0.3407,
7
- "predict_rougeLsum": 0.3407,
8
- "predict_runtime": 2061.934,
 
 
 
9
  "predict_samples": 11334,
10
- "predict_samples_per_second": 5.497,
11
- "predict_steps_per_second": 0.172
12
  }
 
1
  {
2
+ "predict_f1": 0.906,
3
+ "predict_gen_len": 30.77916004940886,
4
+ "predict_loss": 1.6894419193267822,
5
+ "predict_precision": 0.9008,
6
+ "predict_recall": 0.9115,
7
+ "predict_rouge1": 0.4408,
8
+ "predict_rouge2": 0.1888,
9
+ "predict_rougeL": 0.3528,
10
+ "predict_rougeLsum": 0.3528,
11
+ "predict_runtime": 3437.6578,
12
  "predict_samples": 11334,
13
+ "predict_samples_per_second": 3.297,
14
+ "predict_steps_per_second": 0.412
15
  }
runs/Dec28_18-55-30_n4bcoectr1703727001286-fmclw/events.out.tfevents.1703760935.n4bcoectr1703727001286-fmclw.222322.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6250ade1582b24a7e41a8e898a74a51ff41cc6f08621135abe92d27f3acfe73c
3
+ size 7114
special_tokens_map.json CHANGED
@@ -103,32 +103,8 @@
103
  "<unk_101>",
104
  "<unk_102>"
105
  ],
106
- "eos_token": {
107
- "content": "</s>",
108
- "lstrip": false,
109
- "normalized": false,
110
- "rstrip": false,
111
- "single_word": false
112
- },
113
- "mask_token": {
114
- "content": "<mask_2>",
115
- "lstrip": false,
116
- "normalized": false,
117
- "rstrip": false,
118
- "single_word": false
119
- },
120
- "pad_token": {
121
- "content": "<pad>",
122
- "lstrip": false,
123
- "normalized": false,
124
- "rstrip": false,
125
- "single_word": false
126
- },
127
- "unk_token": {
128
- "content": "<unk>",
129
- "lstrip": false,
130
- "normalized": false,
131
- "rstrip": false,
132
- "single_word": false
133
- }
134
  }
 
103
  "<unk_101>",
104
  "<unk_102>"
105
  ],
106
+ "eos_token": "</s>",
107
+ "mask_token": "<mask_2>",
108
+ "pad_token": "<pad>",
109
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
110
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -958,14 +958,10 @@
958
  "full_tokenizer_file": null,
959
  "mask_token": "<mask_2>",
960
  "mask_token_sent": "<mask_1>",
961
- "max_length": 64,
962
  "model_max_length": 1024,
963
  "offset": 103,
964
  "pad_token": "<pad>",
965
  "sp_model_kwargs": {},
966
- "stride": 0,
967
  "tokenizer_class": "PegasusTokenizer",
968
- "truncation_side": "right",
969
- "truncation_strategy": "longest_first",
970
  "unk_token": "<unk>"
971
  }
 
958
  "full_tokenizer_file": null,
959
  "mask_token": "<mask_2>",
960
  "mask_token_sent": "<mask_1>",
 
961
  "model_max_length": 1024,
962
  "offset": 103,
963
  "pad_token": "<pad>",
964
  "sp_model_kwargs": {},
 
965
  "tokenizer_class": "PegasusTokenizer",
 
 
966
  "unk_token": "<unk>"
967
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8c42f961a10319a18532a4b16bc9ea097d53e9ca0abae8d756ba4eb4b19798f
3
  size 4475
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26d5b9dfa3bfcfd0497091597f4c9fea4cbd5ce2b580f26831e93dbcb596500
3
  size 4475