File size: 5,682 Bytes
158e71f 8d5900d 158e71f c7c5e70 df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d df3965c 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 8a9f9df 8d5900d 158e71f 91952c7 158e71f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 |
---
# Licenses declared for this model.
license:
- apache-2.0
- bsd-3-clause
# Free-form tags describing the task and the kind of input text.
tags:
- summarization
- summary
- booksum
- long-document
- long-form
# Dataset(s) associated with this model.
datasets:
- kmfoda/booksum
# Metric families reported for this model (detailed scores live in model-index).
metrics:
- rouge
# NOTE(review): presumably turns off the Hub's hosted inference widget — confirm.
inference: false
# Evaluation results for this model, one `results` entry per task/dataset pair.
# NOTE(review): the `verified` / `verifyToken` pairs look machine-generated;
# presumably they must be kept byte-for-byte — confirm before editing.
model-index:
- name: pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP14
  results:
  # Summarization scores on the samsum test split.
  - task:
      type: summarization
      name: Summarization
    dataset:
      name: samsum
      type: samsum
      config: samsum
      split: test
    metrics:
    - type: rouge
      value: 23.5177
      name: ROUGE-1
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMjMxNGRmYjc0ZjNmZWY3YjFjNDEzYjRhYTAyNWNkOGQ3ODMzM2EwMzk0NTVkMzQ5MGMyYjYxMTkzYWQyMjZiMyIsInZlcnNpb24iOjF9.-PPUZc4Jr6EjNcQ-u9n814SfeviFEaddbFco5d1wbJNoECN_HqciNphSjXh7w99I_rQ6rPIXu8DA93u7aFj9CA
    - type: rouge
      value: 4.668
      name: ROUGE-2
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMWMwYWI1NTg0ZTUwNGIwZjlhYWU2MzQwN2I0NzA1M2MyOTA5YjQ4MTEyYzU2MjRmZTA0NzNiYWM2ZDU0ZThhYyIsInZlcnNpb24iOjF9.CQfgJ3Lha9XR2-IudjfFuaUh_uphWPdYk6TMQOLriWM78_X-paqEIBZDh1Q-WbWoUf-CAyf6UvqXqELRDb3hBQ
    - type: rouge
      value: 16.6091
      name: ROUGE-L
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzhkODRjM2FiYTFhN2E5MWFiNzk3MjgzMGI0NmY0ODNkYjAxZWNmYmFmYmY0NDBmNjRmOTBkMGVhMGYzMmRkMCIsInZlcnNpb24iOjF9.Y66qsqvvGeAoiMCr1xa9enBMfcXt6a6I2i5s7VAJ3aoh3DtM2RlaMm4nuXG4uzWHedWW1NDivBWMZtycYed9DA
    - type: rouge
      value: 20.3174
      name: ROUGE-LSUM
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZWJjODE5NDdlMjM2YjNkOWU3NDJiMWFlZGU2YTRkNzliMTg5MGNkNDQ3YWU3MTBmY2E5ZTUxMzEyMDc0ZTU5YiIsInZlcnNpb24iOjF9.Kc1accwOycbNU1F7AT8LV8jC3NpYKMmOsZmdLeDdIi5BqgMJcQSP8oNt3L-hGbscLb-D7iIvQBFtmmiGqpnGDQ
    - type: loss
      value: 3.2174887657165527
      name: loss
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNTQ0MzQxYTQ1M2NiODcwNTBjOTRiMGEzZDE0NDFlZWJlNmNlOWI1M2M1N2Q2ZTVkNWFiMzQxNDhjODQxNDFkYSIsInZlcnNpb24iOjF9.Vat1Thj2t_1of477BCINeYoTeNZX1NIPG13qVskJ44ivKLJgMr4BCp0luYNEi2skNTv3kYK2orqBdDfxPZlfDw
    - type: gen_len
      value: 57.1966
      name: gen_len
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiY2I3MmZkMDY1YmM5N2VmMGE5OWQ0NDg5OWM0OWViMzU1ZTM1NjBmYWRmN2I2YmM5YTVkNGVlZGViNWEwOGYwMyIsInZlcnNpb24iOjF9.4c6j-ll2veK_PuCcXvRK8-8cPFdedKsqGHQsEhGpwj48uwI3PMqj9mF4HYvSGq5H3rVM_dvyPEEs9RhjCvSHBw
  # Summarization scores on the kmfoda/booksum test split.
  - task:
      type: summarization
      name: Summarization
    dataset:
      name: kmfoda/booksum
      type: kmfoda/booksum
      config: kmfoda--booksum
      split: test
    metrics:
    - type: rouge
      value: 35.9884
      name: ROUGE-1
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNWMzODFmZGYwZmNjY2FkZTJmZWYyMjI1NDdlZDI3OTdmY2MzNzU0M2FhYmMxNTdkOGRiNzIwMTEyMTMwMTgyMSIsInZlcnNpb24iOjF9.pbT1OOzVOjnUp4q6lcpUPunDYTQqOiwQeRLRV69699SoMI3ay4bfd_hbWZUvXOuivoJ5JiDd9KBhEqYUninNCA
    - type: rouge
      value: 6.0596
      name: ROUGE-2
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODNkNTE1NjU5ZmY3MmVmOGQxMjhhODRhZjIzMDRhMzJlYTY3YTkyNzM4YTAyMGI2YzRlMzljMDM5YzFjNzIyOCIsInZlcnNpb24iOjF9.NevkOank_Ou1u2ZfkEa3o4FF4DapvpFK_ucxLRm-xL-ZWGl9cLdLTOxVECrTn8Yasi_sWrjZUhGRWPkCKlJADQ
    - type: rouge
      value: 16.1419
      name: ROUGE-L
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzNkM2M4YjQxM2IwNzIzMjAyMjM3MThlMGQwMDgzMGI3NDU0NWVlOTFhMzBlOGQ3ZTQzOGNkNmE5ZGI5NTkzOCIsInZlcnNpb24iOjF9.8DYhyJAiKIK2aIkQSwMy4NEiBSC4v8_h_3feA-TFBdd-icGg5YvKMQR7_IOa1-9AHBe6PphVSFjl82-nDp6lDA
    - type: rouge
      value: 32.9992
      name: ROUGE-LSUM
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMTEwMmViZmZjMzA3OWYxNWMxZjFhMDBmMDRjOGViYzdiYzllNzk0YWZmNTU0NWIwMmVmZjQzNjlkZTBmZTU0YyIsInZlcnNpb24iOjF9.KFwuSVaUXx958EWZctKpK1wawA0EH4yxBJdp3Zru4Sn97oSyP_s5m-jjZiLfP6kmSajd3849dna-Uw77s3sVBg
    - type: loss
      value: 2.9468588829040527
      name: loss
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzhmODMwMDM2ZDFmNTMzZmFjMmJjMGQ0MmQzMDcyMmFiNmFjMzBhY2RjMTI1MDhiMjI4NTEyYWFlYTNlMzE0ZSIsInZlcnNpb24iOjF9.PHX9VAAgiUGOR8Uxuam4otU65hIzW6hBapaf1KY8o1FDfaoHWAKbSnpjZ3nXKYYeVV6LyGRny_7RdRbbbM8LAA
    - type: gen_len
      value: 298.2593
      name: gen_len
      verified: true
      verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMGYzMDAzNTQyMzgxM2RhNjY3MDIyNGEyMWZjYmYyYmJlNWM3MTFkYzRjMDhkMmZhNDZiN2FhYTY3MGI2NDcxNyIsInZlcnNpb24iOjF9.ax3H6LohHUodVGhSMUWMZZZ-bCTXHEaGpK4jXuOdZkGsewYrX8fO1oRA0uDjACM-eceKFfVnMveHoU9EdMaeCA
---
# long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP14
This model is a fine-tuned version of [pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP13](https://huggingface.co/pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP13) on the kmfoda/booksum dataset.
## Model description
More information needed
## Intended uses & limitations
More information needed
## Training and evaluation data
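The model was fine-tuned on the `kmfoda/booksum` dataset. The metadata at the top of this card reports evaluation results on the `test` splits of `samsum` and `kmfoda/booksum`. More information is needed on preprocessing and on the training/validation splits used.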
## Training procedure
### Training hyperparameters
The following hyperparameters were used during training:
- learning_rate: 0.0006
- train_batch_size: 4
- eval_batch_size: 1
- seed: 42
- distributed_type: multi-GPU
- gradient_accumulation_steps: 16
- total_train_batch_size: 64
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
- lr_scheduler_type: cosine
- lr_scheduler_warmup_ratio: 0.02
- num_epochs: 2
### Framework versions
- Transformers 4.22.0
- Pytorch 1.12.1
- Datasets 2.4.0
- Tokenizers 0.12.1
|