spacemanidol committed on
Commit
272d531
1 Parent(s): 65e05e0

Upload 13 files

Browse files
README.md CHANGED
@@ -6,7 +6,7 @@ datasets:
6
  metrics:
7
  - rouge
8
  model-index:
9
- - name: small-2-6-t
10
  results:
11
  - task:
12
  name: Summarization
@@ -26,9 +26,9 @@ model-index:
26
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
27
  should probably proofread and complete it, then remove this comment. -->
28
 
29
- # small-2-6-t
30
 
31
- This model is a fine-tuned version of [asy/cnndm/small-2-6/](https://huggingface.co/asy/cnndm/small-2-6/) on the cnn_dailymail 3.0.0 dataset.
32
  It achieves the following results on the evaluation set:
33
  - Loss: 1.8186
34
  - Rouge1: 36.8241
 
6
  metrics:
7
  - rouge
8
  model-index:
9
+ - name: small-2-6
10
  results:
11
  - task:
12
  name: Summarization
 
26
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
27
  should probably proofread and complete it, then remove this comment. -->
28
 
29
+ # small-2-6
30
 
31
+ This model is a fine-tuned version of [cnn/small-2-6/](https://huggingface.co/cnn/small-2-6/) on the cnn_dailymail 3.0.0 dataset.
32
  It achieves the following results on the evaluation set:
33
  - Loss: 1.8186
34
  - Rouge1: 36.8241
all_results.json CHANGED
@@ -6,13 +6,13 @@
6
  "eval_rouge2": 15.5366,
7
  "eval_rougeL": 25.7939,
8
  "eval_rougeLsum": 33.9987,
9
- "eval_runtime": 2895.1594,
10
  "eval_samples": 13368,
11
- "eval_samples_per_second": 4.617,
12
- "eval_steps_per_second": 1.154,
13
  "train_loss": 2.1428533047548393,
14
- "train_runtime": 18639.2458,
15
  "train_samples": 287113,
16
- "train_samples_per_second": 46.211,
17
- "train_steps_per_second": 0.722
18
  }
 
6
  "eval_rouge2": 15.5366,
7
  "eval_rougeL": 25.7939,
8
  "eval_rougeLsum": 33.9987,
9
+ "eval_runtime": 2940.0108,
10
  "eval_samples": 13368,
11
+ "eval_samples_per_second": 4.547,
12
+ "eval_steps_per_second": 1.137,
13
  "train_loss": 2.1428533047548393,
14
+ "train_runtime": 19152.4549,
15
  "train_samples": 287113,
16
+ "train_samples_per_second": 44.973,
17
+ "train_steps_per_second": 0.703
18
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "asy/cnndm/small-2-6/",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
 
1
  {
2
+ "_name_or_path": "cnn/small-2-6/",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
eval_results.json CHANGED
@@ -6,8 +6,8 @@
6
  "eval_rouge2": 15.5366,
7
  "eval_rougeL": 25.7939,
8
  "eval_rougeLsum": 33.9987,
9
- "eval_runtime": 2895.1594,
10
  "eval_samples": 13368,
11
- "eval_samples_per_second": 4.617,
12
- "eval_steps_per_second": 1.154
13
  }
 
6
  "eval_rouge2": 15.5366,
7
  "eval_rougeL": 25.7939,
8
  "eval_rougeLsum": 33.9987,
9
+ "eval_runtime": 2940.0108,
10
  "eval_samples": 13368,
11
+ "eval_samples_per_second": 4.547,
12
+ "eval_steps_per_second": 1.137
13
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 2.1428533047548393,
4
- "train_runtime": 18639.2458,
5
  "train_samples": 287113,
6
- "train_samples_per_second": 46.211,
7
- "train_steps_per_second": 0.722
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 2.1428533047548393,
4
+ "train_runtime": 19152.4549,
5
  "train_samples": 287113,
6
+ "train_samples_per_second": 44.973,
7
+ "train_steps_per_second": 0.703
8
  }
trainer_state.json CHANGED
@@ -168,9 +168,9 @@
168
  "step": 13458,
169
  "total_flos": 2.4076495124138803e+17,
170
  "train_loss": 2.1428533047548393,
171
- "train_runtime": 18639.2458,
172
- "train_samples_per_second": 46.211,
173
- "train_steps_per_second": 0.722
174
  }
175
  ],
176
  "max_steps": 13458,
 
168
  "step": 13458,
169
  "total_flos": 2.4076495124138803e+17,
170
  "train_loss": 2.1428533047548393,
171
+ "train_runtime": 19152.4549,
172
+ "train_samples_per_second": 44.973,
173
+ "train_steps_per_second": 0.703
174
  }
175
  ],
176
  "max_steps": 13458,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08155c889cb72a78ddd30a185fb53e42d1c84af4bd0f6bb896261b52826ff100
3
- size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d39a5cd2672486ff40d8dc32363ebf1a136ab4beb6f5ee593c485030f64d336
3
+ size 3707