autoevaluator HF staff committed on
Commit
0646c3f
1 Parent(s): deb0f97

Add evaluation results on the samsum config and test split of samsum

Browse files

Beep boop, I am a bot from Hugging Face's automatic model evaluator 👋!\
Your model has been evaluated on the samsum config and test split of the [samsum](https://huggingface.co/datasets/samsum) dataset by @[email protected], using the predictions stored [here](https://huggingface.co/datasets/autoevaluate/autoeval-eval-samsum-samsum-2c8026-46001145176).\
Accept this pull request to see the results displayed on the [Hub leaderboard](https://huggingface.co/spaces/autoevaluate/leaderboards?dataset=samsum).\
Evaluate your model on more datasets [here](https://huggingface.co/spaces/autoevaluate/model-evaluator?dataset=samsum).

Files changed (1) hide show
  1. README.md +53 -14
README.md CHANGED
@@ -1,12 +1,12 @@
1
  ---
2
  language:
3
  - en
 
4
  tags:
5
  - summarization
6
- license: mit
7
- thumbnail: https://huggingface.co/front/thumbnails/facebook.png
8
  datasets:
9
  - cnn_dailymail
 
10
  model-index:
11
  - name: facebook/bart-large-cnn
12
  results:
@@ -19,30 +19,69 @@ model-index:
19
  config: 3.0.0
20
  split: train
21
  metrics:
22
- - name: ROUGE-1
23
- type: rouge
24
  value: 42.9486
 
25
  verified: true
26
- - name: ROUGE-2
27
- type: rouge
28
  value: 20.8149
 
29
  verified: true
30
- - name: ROUGE-L
31
- type: rouge
32
  value: 30.6186
 
33
  verified: true
34
- - name: ROUGE-LSUM
35
- type: rouge
36
  value: 40.0376
 
37
  verified: true
38
- - name: loss
39
- type: loss
40
  value: 2.529000997543335
 
41
  verified: true
42
- - name: gen_len
43
- type: gen_len
44
  value: 78.5866
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  verified: true
 
46
  ---
47
  # BART (large-sized model), fine-tuned on CNN Daily Mail
48
 
 
1
  ---
2
  language:
3
  - en
4
+ license: mit
5
  tags:
6
  - summarization
 
 
7
  datasets:
8
  - cnn_dailymail
9
+ thumbnail: https://huggingface.co/front/thumbnails/facebook.png
10
  model-index:
11
  - name: facebook/bart-large-cnn
12
  results:
 
19
  config: 3.0.0
20
  split: train
21
  metrics:
22
+ - type: rouge
 
23
  value: 42.9486
24
+ name: ROUGE-1
25
  verified: true
26
+ - type: rouge
 
27
  value: 20.8149
28
+ name: ROUGE-2
29
  verified: true
30
+ - type: rouge
 
31
  value: 30.6186
32
+ name: ROUGE-L
33
  verified: true
34
+ - type: rouge
 
35
  value: 40.0376
36
+ name: ROUGE-LSUM
37
  verified: true
38
+ - type: loss
 
39
  value: 2.529000997543335
40
+ name: loss
41
  verified: true
42
+ - type: gen_len
 
43
  value: 78.5866
44
+ name: gen_len
45
+ verified: true
46
+ - task:
47
+ type: summarization
48
+ name: Summarization
49
+ dataset:
50
+ name: samsum
51
+ type: samsum
52
+ config: samsum
53
+ split: test
54
+ metrics:
55
+ - type: rouge
56
+ value: 30.7603
57
+ name: ROUGE-1
58
+ verified: true
59
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDYxYjgyZDNmMGEwMmU1MjQwZjg2MTJiMTJmNzAzNWNhZWNiNjk4YTBiM2YwNzljN2FlYTUwMmQyMzgyNTkxNiIsInZlcnNpb24iOjF9.KY5rCCPp6yugf_i0ox6OLOckgfdIJ3cZ8PoMg9V1mZ_qLxJ0tO2HvKtCkjgg9mgqWovM1b-1QKl-crItB0m2CQ
60
+ - type: rouge
61
+ value: 10.2478
62
+ name: ROUGE-2
63
+ verified: true
64
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNzhlNjhkZmRhMGYxOGQyMmMyMGJhY2FlYmY3NjFjOGFiZGM0MzdjOTc4YTE0N2MwNWZkZGZmZWE1NWI2MTg1NSIsInZlcnNpb24iOjF9.dBlclY9GzPBxvxRSiE9JuACh0KleJsnqAVCaFwHGGTXWqwCkgr_A_h0W4O5iuzB6Mq---tF3_-1JutofPHw5AQ
65
+ - type: rouge
66
+ value: 23.1045
67
+ name: ROUGE-L
68
+ verified: true
69
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjllYTk0NzQyMGQwZDcxMjdjMmQ3NjA0ZGE1YWFkM2MwNzI2NDc4MDA1YzQ3YjM1ZjhjMTVkMGExOGU0ZmM5MyIsInZlcnNpb24iOjF9.RmZ4OtuSl9ux7eZj0FdUdFOibN5rr5e4mIToq8adX8mWgm8nzHUxInc0lo7RjOJHdFasUYHh-jxuhy11zXB4Ag
70
+ - type: rouge
71
+ value: 28.6384
72
+ name: ROUGE-LSUM
73
+ verified: true
74
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjhlYTg5MTQ1ODAzZGUxOGEzYjI4YTA3MTA1MmNkNDViYTk4ZWVhZWUwNzczMDgyZWViMWVkODYzYmI2MDExOCIsInZlcnNpb24iOjF9.Hg0ERMXrgsie9MElsQD2tZYZfkptrrVRxt_eREzFLrfpdzT52R75YLO9jCPPxPyUzflY05hA13DhLmQh-_73Cg
75
+ - type: loss
76
+ value: 2.1912083625793457
77
+ name: loss
78
+ verified: true
79
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMDU0MTNkMTcxYjI4MjAzZjdmYjIyMDRiZDQ1NzI2MjRjM2QyNzU0MTliOTA5MDE3ZmIyYmY2NzI0MjE0OWM1NyIsInZlcnNpb24iOjF9.Z7ezEIG_ovOGFCsCnMLg4Wcede5cBlZP0lRbks9w9ceuSCESp8Qdeksa8S7pHpGBCBbOwR1xFyMOOxZZAp9pDA
80
+ - type: gen_len
81
+ value: 66.6813
82
+ name: gen_len
83
  verified: true
84
+ verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOTRmMWYwMzgyZjVkZjk4YjZlNGZiODhhNTc0YjI5MmFmMWJhYWNlNTIyMDU2NTM0OTc5YTVmNWQ5MGYxZjBkMSIsInZlcnNpb24iOjF9.l95E7CZ_UaQ5Cke_7l6MNoqyRXah6fLZTC7e2FYRGPp8dst-Ke-fyB-o7TdKFV_2tXYtz2J5PWmunYf9Oe3QBA
85
  ---
86
  # BART (large-sized model), fine-tuned on CNN Daily Mail
87