autoevaluator's picture
Add evaluation results on the samsum config and test split of samsum
79280ec
|
raw
history blame
2.31 kB
metadata
# Model-card metadata: declares the pipeline tag and one set of evaluation
# results (summarization on the samsum test split) for a single model.
pipeline_tag: summarization
model-index:
  # One entry per model; this file describes a single model.
  - name: 0x70DA/pegasus-cnn_dailymail
    results:
      # Single result set: one task evaluated on one dataset/config/split.
      - task:
          type: summarization
          name: Summarization
        dataset:
          name: samsum
          type: samsum
          config: samsum
          split: test
        # Six reported metrics: four ROUGE variants, loss, and gen_len.
        # Each entry carries `verified: true` plus a `verifyToken`.
        # NOTE(review): the tokens look like signed JWT-style strings issued by
        # the evaluation service, presumably tied to the reported values; do not
        # hand-edit a value or token without re-running evaluation. TODO confirm.
        metrics:
          # ROUGE entries share `type: rouge`; `name` distinguishes the variant.
          # NOTE(review): values appear to be on a 0-100 scale; confirm.
          - type: rouge
            value: 46.2339
            name: ROUGE-1
            verified: true
            verifyToken: >-
              eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOTcyMTMzNzM0ZWZiM2Y1MGRlMGM4ZjRjMWM4ZGUxMzA3ZDNkYzBhMDU0NzQ1MTdjY2VkMjFiZGMyODQ4ZmRhMSIsInZlcnNpb24iOjF9.mk7dNvRAmUH7oBHerwfPAK8fUYDbTbyqNPpY9Stth14vUjYSVAKMpS-Bc5HWXatA-8CUTEDTWD3DS1oqYvZmBQ
          - type: rouge
            value: 23.0428
            name: ROUGE-2
            verified: true
            verifyToken: >-
              eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMDg4MmJjMzY1OWFmZGIxODY2N2MyNjhmOTBjYTI4Mzk0NmY1OTUxMzUxOGJmNzM5OTVjNTM4NDQ1ZTJmMGU4NSIsInZlcnNpb24iOjF9.HviUXjc0Gnk1OLgrCGCM0_xcWZKjpBYem0drJAxfv6zUmev4qm8DNBMgFkN7dIi3E9rDV3IRfRbnRvq3dFv_BQ
          - type: rouge
            value: 36.9683
            name: ROUGE-L
            verified: true
            verifyToken: >-
              eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMGVhYzFkZjAwNjliNzcyODJlNmZmYmIzOTUyZGZlMDA4MGM4MWIxNTAxYWQzNTM4MjBhZTJiZDhkZTRlZjg4YSIsInZlcnNpb24iOjF9.B-sZ9a5r5vyiRyIrpTqiKVKcSoxVU9jK4SVUyf-I4gAiJlkjmjPgxIeQCrsqVyAYgdWB8dT55XdmHH2PKzrsDA
          - type: rouge
            value: 42.3904
            name: ROUGE-LSUM
            verified: true
            verifyToken: >-
              eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYTBmNzJiOGExOTE4YjE2NWNkM2Q0OWU1OGZkMWZiMDkwYTg4MjE2ZWIwMmVjN2U3OTg0YWE3NWRhYzZkYWU4MyIsInZlcnNpb24iOjF9.zoDfAowrohlYEtzVjNx2Es47EA8pTDAp8EEJSSsVsPWO-tvbbrfYiaKU4fn5ZeBmse8gPAfI2aTtdd9zwRBkCg
          # Loss is stored at full float precision, unlike the 4-decimal values
          # used by the other metrics in this list.
          - type: loss
            value: 1.431406021118164
            name: loss
            verified: true
            verifyToken: >-
              eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMDc3ZDZmODBmOWM3NDE3NGI2NmFmYTY4NzY2ZWZiYWMwMzA1ZGEwNGQwNTk3OTczY2NmMzQyMjgxYzM3YzNjZiIsInZlcnNpb24iOjF9.Og0tL4Sxq4tgbBa6lyNynhdpUoMOYloTyMmfJHJgYu9BveJL1o9JG9xW4paeQUxeUTUpxVy4c9r_gfpaC1mYAQ
          # NOTE(review): gen_len is presumably the mean generated summary
          # length (unit not stated here, likely tokens); confirm.
          - type: gen_len
            value: 35.7839
            name: gen_len
            verified: true
            verifyToken: >-
              eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMmZmY2EwNjJiNDJhNmRlYjFmYjA5OGMyZWY2YmMyZmIyOTU0MGNmNTNjYjkwNTdmNmM0OGNiMTk1MGIxM2I4ZSIsInZlcnNpb24iOjF9.uDEOBFKTf3pM8_Ftjkr7asJj7gsnS4DmnZCVwL7vMGt2FiOzlYKRBKxB35JPHrcBNl6TI0c_0HApzdjFqiabDQ