--- license: - apache-2.0 - bsd-3-clause tags: - summarization - summary - booksum - long-document - long-form datasets: - kmfoda/booksum metrics: - rouge inference: false base_model: pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP13 model-index: - name: pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP15 results: - task: type: summarization name: Summarization dataset: name: samsum type: samsum config: samsum split: test metrics: - type: rouge value: 24.5482 name: ROUGE-1 verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiM2U3MGNlNzI0MGNiYWQ2NGRhYzg5M2Y3NjhjYTdhZmVlYWNmM2Y0YTFhN2I2ZmI5NDVkY2I2M2MxMjM5ZDIwOSIsInZlcnNpb24iOjF9.tHnV8ofGr9jbx0fHm3cDL6p8nqXZITS1H6XLjW-iWaNFuQJ7Qfs7E0uYNf2haQP6Mu5K5eWWGdg54KtMi1N9DA - type: rouge value: 4.811 name: ROUGE-2 verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzE1ODYzOGFhMDE4ZGU1OTM0OTM5NDBkNjEwODQzY2I1NzRhYTc0NDJjZmM5YzI4ZGZmZGNkZjljYmNlYTQ1YyIsInZlcnNpb24iOjF9.n7tOZFKEePwSEqM7a0Y-fBiEEi3jZL7QwP0MCQNun5yKsd2OIkTlruuauV3h8yHN5yKxg33CUfpzS2B44kGjBg - type: rouge value: 17.2505 name: ROUGE-L verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMjM3YTYwNjAyYzY5MmZjMzI1MmYwNzI2OWNmMzJiNzk3MTY5Y2E4ZmM1OTIyYjQ1NTkxMjI1ZGMwYmRiYzg5NiIsInZlcnNpb24iOjF9.1VQIehrugMj213RavmSAf1qsKTG3Jmj6DAJGi3KOeOYrJpKeLBQ6ftQZ_wSje8UiyR9uekne1wTd256sr61DBQ - type: rouge value: 20.906 name: ROUGE-LSUM verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDdhNjJlOTY3ZjgxOGMzYjkzOGI2NGJlZDY0MDk0NmE5ZDcyMzIyNTA1M2ZhNmMyOTFlODJjZWJkY2ZjMTQ3NCIsInZlcnNpb24iOjF9.SLAdCUY_9PFb7BrvvpN2ABDU9uvy7EIMEHKtnlpH94nZbv2G2sj74tWLcIQstuTkmXmLTk6_HvdZTEaoUc-5CA - type: loss value: 3.3002164363861084 name: loss verified: true verifyToken: 
eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDFkM2UyOWQ5YzM2ZDIwZGRmNTY2YTRlMzUzY2QxZDhkNGFmODljNjIxNWQxZjFhM2E2YjM4ZWRjZDUzNWQxNyIsInZlcnNpb24iOjF9.HUYhxEAGbZS8J76Zt9k5KNFt6dx_vdoqf34k5ht3X0BTB4u2WiYwVS9O0ka2ExCynIODo9OMWLcMG2CW-xnjBA - type: gen_len value: 52 name: gen_len verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZTkxMWQ0ZWVlNWUxNjYwNTU3MTQzYjRhZGI1YjQ1ODYxOGRlNTU0ZjlkOGZiN2UzM2I5MjU3Y2QxODU3MTJmZCIsInZlcnNpb24iOjF9.9iDB-q3h2qYZIRHLKryZIjYYUeN_4_9hr5miRgmJl8TYB1Prf69NNziW7QPOkMXMOM-5-xvRVKmx-JqZQSkcDg - task: type: summarization name: Summarization dataset: name: kmfoda/booksum type: kmfoda/booksum config: kmfoda--booksum split: test metrics: - type: rouge value: 35.3305 name: ROUGE-1 verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiY2Q0NWU1Mjc0ZTYxOGM5NjI3NTlmODYwMmU4ODE3Y2VjYjdmNTRhOWI2MDdlM2U3OTk5N2Q3YTcyYTViYzIwMiIsInZlcnNpb24iOjF9.ScFds-4QZgG0Wro-w0qnoaQSoXXMpWOTEE4zYrvA9k2lew965geaqeBVAt7QQxwchuB9q26hSGYCEqLMdX3EBw - type: rouge value: 5.8001 name: ROUGE-2 verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYjFiNjU2ZjI1YmE2NDViZjUwMjI1ZWFiNDkyMjExZjJjMjBmN2I5ZmYyYjE0MGEzNzk3ZGE4YTMzNzA0M2NjNSIsInZlcnNpb24iOjF9.H4r1JTjEC3ABkgVIi8i3TRxQ1gMsYoQR8qCBbJVkdWJQwECzWGZRw6QIaWz0kZv73nQ890kf90JE6FKeD2MpAg - type: rouge value: 16.0557 name: ROUGE-L verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjBjNTBiYmM3OWM3ZjFkN2FjZTBiMGJkMTg4MTYxYzRjNWUzNWE2YWVjOWJiMzRkZTMxMGFkYThlYmZiN2UwNSIsInZlcnNpb24iOjF9.mLij-24wue3udXSS5H3kBniefh7NDTmNf3bxacq7UinFkbTtqx9OvS6Ywun4LfJj_Ufn9-uTMR2VbaoIIQKkBA - type: rouge value: 32.3409 name: ROUGE-LSUM verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjg3ODliOTAzYzg4Y2NhNzI4M2I4OGM1ZGQwMWE5ZjBiZGQyNTNhMDQxZDllMzgxOGM0NWZjZTJjMzFkZGVkZSIsInZlcnNpb24iOjF9.LpNcyf7HNaL_xwb4zqrBgOPoTBWFaBN0AgSbzsgfsQ7J12CIi7s0UoBhxg_c8UYwNuqFOZouYIq78r1PM81RCA - type: loss value: 3.0063540935516357 name: loss 
verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMTJmMGM2Y2U0MDU0OTFlMzJlNTNlZjViYTAyYjE4YTVkOWJhMmQxZjc3MjM4ZGNkNTNmOTViNDYwZjg0MWI0YyIsInZlcnNpb24iOjF9.VLKkHEjp4Iq1r3-CXSABBzgPJFx1sbjRt5KbbKe_AEuKuJtXI6rRWPuBjudOLB-CHBvutDzVS9wR60pGaQ5jCg - type: gen_len value: 268.4032 name: gen_len verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYjJmYjZhOGFkMGNkZjEzOTA0Y2RjNWU3Yjc2ZGI5NWU1MTNjZjY5NzFiZjI0YjBhZjUxMDFlMjBmZTYxMWE0ZCIsInZlcnNpb24iOjF9.vnImpJVQBidfhKVOzEYuA2okKgbTvB0bkc4GNmvkTlxXdZlsqg1KuevQa587lmy0LQOZk1_pYWz0aVJ4VQQQAA - task: type: summarization name: Summarization dataset: name: launch/gov_report type: launch/gov_report config: plain_text split: test metrics: - type: rouge value: 37.0412 name: ROUGE-1 verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOTQ0NzdhYjdlNDNhYjJmNzQwM2E1OWQ3ZTQxMTZiY2IwNjJkMzE0YzNmMWZjZTI0NGI2NWYzNTU0ODM0OTVmMCIsInZlcnNpb24iOjF9.1Gf6zoMOLmf71bkW9RdiXJPDms-vfc0hu0jJehdb7XCjW-hPcmLxdk8ALwWi9knBmeHZ18GHHSJklgU_maFoAA - type: rouge value: 8.519 name: ROUGE-2 verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2M0MTE2YTE5NmE1NjhkMGM0ZjYxMzJiOTFjZGNmOTdlZWFhOTExZTAzOGUyOWE4Yjg4MTE3NDcwZTg5ZDk0MCIsInZlcnNpb24iOjF9.6EeSA2FzddyK5EfHhBViKNDXIZp9svVTpvSi4O_9YULWX6Gs4bZYcGRQATGLS6Pfvh1swky1ZXXR5GpX4tN-Ag - type: rouge value: 17.8685 name: ROUGE-L verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNTZmMWRhZmNmZDY5MzYzM2JhNDc5NzdiMWI3MmRlYWViZjA0NGQxZDJhNjIxZTY3ZTM2NTJjYjI0ODE5MGFlYiIsInZlcnNpb24iOjF9.Tz6vT3YFZO5Hd8BySoXmtcwDQMSvr4DLGvKYpTeH7L0iZOaIFr8XILCPbLV6ZxjglSgFwMzcwsjN1d032mEqBA - type: rouge value: 33.5036 name: ROUGE-LSUM verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzgzNGQyMTIxYWUwMDlkMjQwZDE5ZDRmYzczODJkZTIxOGE5MTEyZDNjYzMzZWFhMGUyMjljNDQ5NGQ4ZGRkOCIsInZlcnNpb24iOjF9.oR8vSpgDjMskRmcImHV4E5dkXbP74BKNYXmfpkpO5zIHIJWNNyJvUSKurDDy5rhbhbkI98kF5GmOcLlfghyrDA - type: loss value: 
3.628979444503784 name: loss verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMTNkY2E0Y2Q1YjA3Y2VhYTAyOGE1NmQyYWQ0YzM5NzczOTBkYThiYzNjMDljY2YzZGYzMGQ3NGQ5YzRhN2M5OCIsInZlcnNpb24iOjF9.kD1yDRyt6PR5wKBHvsU4l6stGmcsvPbkGB1dMgSfvMWV0LjjSc3MaXUS2ykNciLdnJK_aSqIjSUbUDyO0e4oDA - type: gen_len value: 219.3885 name: gen_len verified: true verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzI2MjIyZWViY2I0NTE0YWMxYTE3OTAyODdhOTNlZDZkOTIyMjQ1NzdkMmU5YTY5NmNjYTNkOGI0ODk4YzE2OSIsInZlcnNpb24iOjF9.sqlm-kWBzo-sJ4PaelnJWeQ1usF3nM5ZJP8igXE2GhWNhAQVsST3tlvcA8GwRtfbVCAy_x7Ex9iOuYqpccdbDA
---

# long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP15

This model is a fine-tuned version of [pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP13](https://huggingface.co/pszemraj/long-t5-tglobal-large-pubmed-3k-booksum-16384-WIP13) on the `kmfoda/booksum` dataset.

## Model description

More information needed

## Intended uses & limitations

More information needed

## Training and evaluation data

More information needed

## Training procedure

### Training hyperparameters

The following hyperparameters were used during training:

- learning_rate: 0.0004
- train_batch_size: 1
- eval_batch_size: 1
- seed: 42
- distributed_type: multi-GPU
- gradient_accumulation_steps: 64
- total_train_batch_size: 64
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
- lr_scheduler_type: cosine
- lr_scheduler_warmup_ratio: 0.01
- num_epochs: 1.4

### Framework versions

- Transformers 4.23.0.dev0
- PyTorch 1.10.0+cu113
- Datasets 2.4.0
- Tokenizers 0.12.1