Remove ` (default)` from MTEB metadata (#1)
Browse files
- Remove ` (default)` from MTEB metadata (51793d5659473e0dfd51f8ae132e79d3aff8f947)
Co-authored-by: Tom Aarsen <[email protected]>
README.md
CHANGED
@@ -29,7 +29,7 @@ model-index:
|
|
29 |
type: Classification
|
30 |
- dataset:
|
31 |
config: default
|
32 |
-
name: MTEB AmazonPolarityClassification (default)
|
33 |
revision: e2d317d38cd51312af73b3d32a06d1a08b442046
|
34 |
split: test
|
35 |
type: mteb/amazon_polarity
|
@@ -71,7 +71,7 @@ model-index:
|
|
71 |
type: Classification
|
72 |
- dataset:
|
73 |
config: default
|
74 |
-
name: MTEB ArguAna (default)
|
75 |
revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
|
76 |
split: test
|
77 |
type: mteb/arguana
|
@@ -142,7 +142,7 @@ model-index:
|
|
142 |
type: Retrieval
|
143 |
- dataset:
|
144 |
config: default
|
145 |
-
name: MTEB ArxivClusteringP2P (default)
|
146 |
revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
|
147 |
split: test
|
148 |
type: mteb/arxiv-clustering-p2p
|
@@ -157,7 +157,7 @@ model-index:
|
|
157 |
type: Clustering
|
158 |
- dataset:
|
159 |
config: default
|
160 |
-
name: MTEB ArxivClusteringS2S (default)
|
161 |
revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
|
162 |
split: test
|
163 |
type: mteb/arxiv-clustering-s2s
|
@@ -172,7 +172,7 @@ model-index:
|
|
172 |
type: Clustering
|
173 |
- dataset:
|
174 |
config: default
|
175 |
-
name: MTEB AskUbuntuDupQuestions (default)
|
176 |
revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
|
177 |
split: test
|
178 |
type: mteb/askubuntudupquestions-reranking
|
@@ -187,7 +187,7 @@ model-index:
|
|
187 |
type: Reranking
|
188 |
- dataset:
|
189 |
config: default
|
190 |
-
name: MTEB BIOSSES (default)
|
191 |
revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
|
192 |
split: test
|
193 |
type: mteb/biosses-sts
|
@@ -210,7 +210,7 @@ model-index:
|
|
210 |
type: STS
|
211 |
- dataset:
|
212 |
config: default
|
213 |
-
name: MTEB Banking77Classification (default)
|
214 |
revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
|
215 |
split: test
|
216 |
type: mteb/banking77
|
@@ -229,7 +229,7 @@ model-index:
|
|
229 |
type: Classification
|
230 |
- dataset:
|
231 |
config: default
|
232 |
-
name: MTEB BiorxivClusteringP2P (default)
|
233 |
revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
|
234 |
split: test
|
235 |
type: mteb/biorxiv-clustering-p2p
|
@@ -244,7 +244,7 @@ model-index:
|
|
244 |
type: Clustering
|
245 |
- dataset:
|
246 |
config: default
|
247 |
-
name: MTEB BiorxivClusteringS2S (default)
|
248 |
revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
|
249 |
split: test
|
250 |
type: mteb/biorxiv-clustering-s2s
|
@@ -259,7 +259,7 @@ model-index:
|
|
259 |
type: Clustering
|
260 |
- dataset:
|
261 |
config: default
|
262 |
-
name: MTEB CQADupstackRetrieval (default)
|
263 |
revision: 46989137a86843e03a6195de44b09deda022eec7
|
264 |
split: test
|
265 |
type: CQADupstackRetrieval_is_a_combined_dataset
|
@@ -330,7 +330,7 @@ model-index:
|
|
330 |
type: Retrieval
|
331 |
- dataset:
|
332 |
config: default
|
333 |
-
name: MTEB ClimateFEVER (default)
|
334 |
revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
|
335 |
split: test
|
336 |
type: mteb/climate-fever
|
@@ -401,7 +401,7 @@ model-index:
|
|
401 |
type: Retrieval
|
402 |
- dataset:
|
403 |
config: default
|
404 |
-
name: MTEB DBPedia (default)
|
405 |
revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
|
406 |
split: test
|
407 |
type: mteb/dbpedia
|
@@ -472,7 +472,7 @@ model-index:
|
|
472 |
type: Retrieval
|
473 |
- dataset:
|
474 |
config: default
|
475 |
-
name: MTEB EmotionClassification (default)
|
476 |
revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
|
477 |
split: test
|
478 |
type: mteb/emotion
|
@@ -491,7 +491,7 @@ model-index:
|
|
491 |
type: Classification
|
492 |
- dataset:
|
493 |
config: default
|
494 |
-
name: MTEB FEVER (default)
|
495 |
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
496 |
split: test
|
497 |
type: mteb/fever
|
@@ -562,7 +562,7 @@ model-index:
|
|
562 |
type: Retrieval
|
563 |
- dataset:
|
564 |
config: default
|
565 |
-
name: MTEB FiQA2018 (default)
|
566 |
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
567 |
split: test
|
568 |
type: mteb/fiqa
|
@@ -633,7 +633,7 @@ model-index:
|
|
633 |
type: Retrieval
|
634 |
- dataset:
|
635 |
config: default
|
636 |
-
name: MTEB HotpotQA (default)
|
637 |
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
638 |
split: test
|
639 |
type: mteb/hotpotqa
|
@@ -704,7 +704,7 @@ model-index:
|
|
704 |
type: Retrieval
|
705 |
- dataset:
|
706 |
config: default
|
707 |
-
name: MTEB ImdbClassification (default)
|
708 |
revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
|
709 |
split: test
|
710 |
type: mteb/imdb
|
@@ -727,7 +727,7 @@ model-index:
|
|
727 |
type: Classification
|
728 |
- dataset:
|
729 |
config: default
|
730 |
-
name: MTEB MSMARCO (default)
|
731 |
revision: c5a29a104738b98a9e76336939199e264163d4a0
|
732 |
split: dev
|
733 |
type: mteb/msmarco
|
@@ -874,7 +874,7 @@ model-index:
|
|
874 |
type: Classification
|
875 |
- dataset:
|
876 |
config: default
|
877 |
-
name: MTEB MedrxivClusteringP2P (default)
|
878 |
revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
|
879 |
split: test
|
880 |
type: mteb/medrxiv-clustering-p2p
|
@@ -889,7 +889,7 @@ model-index:
|
|
889 |
type: Clustering
|
890 |
- dataset:
|
891 |
config: default
|
892 |
-
name: MTEB MedrxivClusteringS2S (default)
|
893 |
revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
|
894 |
split: test
|
895 |
type: mteb/medrxiv-clustering-s2s
|
@@ -904,7 +904,7 @@ model-index:
|
|
904 |
type: Clustering
|
905 |
- dataset:
|
906 |
config: default
|
907 |
-
name: MTEB MindSmallReranking (default)
|
908 |
revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
|
909 |
split: test
|
910 |
type: mteb/mind_small
|
@@ -919,7 +919,7 @@ model-index:
|
|
919 |
type: Reranking
|
920 |
- dataset:
|
921 |
config: default
|
922 |
-
name: MTEB NFCorpus (default)
|
923 |
revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
|
924 |
split: test
|
925 |
type: mteb/nfcorpus
|
@@ -990,7 +990,7 @@ model-index:
|
|
990 |
type: Retrieval
|
991 |
- dataset:
|
992 |
config: default
|
993 |
-
name: MTEB NQ (default)
|
994 |
revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
|
995 |
split: test
|
996 |
type: mteb/nq
|
@@ -1061,7 +1061,7 @@ model-index:
|
|
1061 |
type: Retrieval
|
1062 |
- dataset:
|
1063 |
config: default
|
1064 |
-
name: MTEB QuoraRetrieval (default)
|
1065 |
revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
|
1066 |
split: test
|
1067 |
type: mteb/quora
|
@@ -1132,7 +1132,7 @@ model-index:
|
|
1132 |
type: Retrieval
|
1133 |
- dataset:
|
1134 |
config: default
|
1135 |
-
name: MTEB RedditClustering (default)
|
1136 |
revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
|
1137 |
split: test
|
1138 |
type: mteb/reddit-clustering
|
@@ -1147,7 +1147,7 @@ model-index:
|
|
1147 |
type: Clustering
|
1148 |
- dataset:
|
1149 |
config: default
|
1150 |
-
name: MTEB RedditClusteringP2P (default)
|
1151 |
revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
|
1152 |
split: test
|
1153 |
type: mteb/reddit-clustering-p2p
|
@@ -1162,7 +1162,7 @@ model-index:
|
|
1162 |
type: Clustering
|
1163 |
- dataset:
|
1164 |
config: default
|
1165 |
-
name: MTEB SCIDOCS (default)
|
1166 |
revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
|
1167 |
split: test
|
1168 |
type: mteb/scidocs
|
@@ -1233,7 +1233,7 @@ model-index:
|
|
1233 |
type: Retrieval
|
1234 |
- dataset:
|
1235 |
config: default
|
1236 |
-
name: MTEB SICK-R (default)
|
1237 |
revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
|
1238 |
split: test
|
1239 |
type: mteb/sickr-sts
|
@@ -1256,7 +1256,7 @@ model-index:
|
|
1256 |
type: STS
|
1257 |
- dataset:
|
1258 |
config: default
|
1259 |
-
name: MTEB STS12 (default)
|
1260 |
revision: a0d554a64d88156834ff5ae9920b964011b16384
|
1261 |
split: test
|
1262 |
type: mteb/sts12-sts
|
@@ -1279,7 +1279,7 @@ model-index:
|
|
1279 |
type: STS
|
1280 |
- dataset:
|
1281 |
config: default
|
1282 |
-
name: MTEB STS13 (default)
|
1283 |
revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
|
1284 |
split: test
|
1285 |
type: mteb/sts13-sts
|
@@ -1302,7 +1302,7 @@ model-index:
|
|
1302 |
type: STS
|
1303 |
- dataset:
|
1304 |
config: default
|
1305 |
-
name: MTEB STS14 (default)
|
1306 |
revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
|
1307 |
split: test
|
1308 |
type: mteb/sts14-sts
|
@@ -1325,7 +1325,7 @@ model-index:
|
|
1325 |
type: STS
|
1326 |
- dataset:
|
1327 |
config: default
|
1328 |
-
name: MTEB STS15 (default)
|
1329 |
revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
|
1330 |
split: test
|
1331 |
type: mteb/sts15-sts
|
@@ -1348,7 +1348,7 @@ model-index:
|
|
1348 |
type: STS
|
1349 |
- dataset:
|
1350 |
config: default
|
1351 |
-
name: MTEB STS16 (default)
|
1352 |
revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
|
1353 |
split: test
|
1354 |
type: mteb/sts16-sts
|
@@ -1417,7 +1417,7 @@ model-index:
|
|
1417 |
type: STS
|
1418 |
- dataset:
|
1419 |
config: default
|
1420 |
-
name: MTEB STSBenchmark (default)
|
1421 |
revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
|
1422 |
split: test
|
1423 |
type: mteb/stsbenchmark-sts
|
@@ -1440,7 +1440,7 @@ model-index:
|
|
1440 |
type: STS
|
1441 |
- dataset:
|
1442 |
config: default
|
1443 |
-
name: MTEB SciDocsRR (default)
|
1444 |
revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
|
1445 |
split: test
|
1446 |
type: mteb/scidocs-reranking
|
@@ -1455,7 +1455,7 @@ model-index:
|
|
1455 |
type: Reranking
|
1456 |
- dataset:
|
1457 |
config: default
|
1458 |
-
name: MTEB SciFact (default)
|
1459 |
revision: 0228b52cf27578f30900b9e5271d331663a030d7
|
1460 |
split: test
|
1461 |
type: mteb/scifact
|
@@ -1526,7 +1526,7 @@ model-index:
|
|
1526 |
type: Retrieval
|
1527 |
- dataset:
|
1528 |
config: default
|
1529 |
-
name: MTEB SprintDuplicateQuestions (default)
|
1530 |
revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
|
1531 |
split: test
|
1532 |
type: mteb/sprintduplicatequestions-pairclassification
|
@@ -1597,7 +1597,7 @@ model-index:
|
|
1597 |
type: PairClassification
|
1598 |
- dataset:
|
1599 |
config: default
|
1600 |
-
name: MTEB StackExchangeClustering (default)
|
1601 |
revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
|
1602 |
split: test
|
1603 |
type: mteb/stackexchange-clustering
|
@@ -1612,7 +1612,7 @@ model-index:
|
|
1612 |
type: Clustering
|
1613 |
- dataset:
|
1614 |
config: default
|
1615 |
-
name: MTEB StackExchangeClusteringP2P (default)
|
1616 |
revision: 815ca46b2622cec33ccafc3735d572c266efdb44
|
1617 |
split: test
|
1618 |
type: mteb/stackexchange-clustering-p2p
|
@@ -1627,7 +1627,7 @@ model-index:
|
|
1627 |
type: Clustering
|
1628 |
- dataset:
|
1629 |
config: default
|
1630 |
-
name: MTEB StackOverflowDupQuestions (default)
|
1631 |
revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
|
1632 |
split: test
|
1633 |
type: mteb/stackoverflowdupquestions-reranking
|
@@ -1642,7 +1642,7 @@ model-index:
|
|
1642 |
type: Reranking
|
1643 |
- dataset:
|
1644 |
config: default
|
1645 |
-
name: MTEB SummEval (default)
|
1646 |
revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
|
1647 |
split: test
|
1648 |
type: mteb/summeval
|
@@ -1661,7 +1661,7 @@ model-index:
|
|
1661 |
type: Summarization
|
1662 |
- dataset:
|
1663 |
config: default
|
1664 |
-
name: MTEB TRECCOVID (default)
|
1665 |
revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
|
1666 |
split: test
|
1667 |
type: mteb/trec-covid
|
@@ -1732,7 +1732,7 @@ model-index:
|
|
1732 |
type: Retrieval
|
1733 |
- dataset:
|
1734 |
config: default
|
1735 |
-
name: MTEB Touche2020 (default)
|
1736 |
revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
|
1737 |
split: test
|
1738 |
type: mteb/touche2020
|
@@ -1803,7 +1803,7 @@ model-index:
|
|
1803 |
type: Retrieval
|
1804 |
- dataset:
|
1805 |
config: default
|
1806 |
-
name: MTEB ToxicConversationsClassification (default)
|
1807 |
revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
|
1808 |
split: test
|
1809 |
type: mteb/toxic_conversations_50k
|
@@ -1826,7 +1826,7 @@ model-index:
|
|
1826 |
type: Classification
|
1827 |
- dataset:
|
1828 |
config: default
|
1829 |
-
name: MTEB TweetSentimentExtractionClassification (default)
|
1830 |
revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
|
1831 |
split: test
|
1832 |
type: mteb/tweet_sentiment_extraction
|
@@ -1845,7 +1845,7 @@ model-index:
|
|
1845 |
type: Classification
|
1846 |
- dataset:
|
1847 |
config: default
|
1848 |
-
name: MTEB TwentyNewsgroupsClustering (default)
|
1849 |
revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
|
1850 |
split: test
|
1851 |
type: mteb/twentynewsgroups-clustering
|
@@ -1860,7 +1860,7 @@ model-index:
|
|
1860 |
type: Clustering
|
1861 |
- dataset:
|
1862 |
config: default
|
1863 |
-
name: MTEB TwitterSemEval2015 (default)
|
1864 |
revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
|
1865 |
split: test
|
1866 |
type: mteb/twittersemeval2015-pairclassification
|
@@ -1931,7 +1931,7 @@ model-index:
|
|
1931 |
type: PairClassification
|
1932 |
- dataset:
|
1933 |
config: default
|
1934 |
-
name: MTEB TwitterURLCorpus (default)
|
1935 |
revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
|
1936 |
split: test
|
1937 |
type: mteb/twitterurlcorpus-pairclassification
|
|
|
29 |
type: Classification
|
30 |
- dataset:
|
31 |
config: default
|
32 |
+
name: MTEB AmazonPolarityClassification
|
33 |
revision: e2d317d38cd51312af73b3d32a06d1a08b442046
|
34 |
split: test
|
35 |
type: mteb/amazon_polarity
|
|
|
71 |
type: Classification
|
72 |
- dataset:
|
73 |
config: default
|
74 |
+
name: MTEB ArguAna
|
75 |
revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
|
76 |
split: test
|
77 |
type: mteb/arguana
|
|
|
142 |
type: Retrieval
|
143 |
- dataset:
|
144 |
config: default
|
145 |
+
name: MTEB ArxivClusteringP2P
|
146 |
revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
|
147 |
split: test
|
148 |
type: mteb/arxiv-clustering-p2p
|
|
|
157 |
type: Clustering
|
158 |
- dataset:
|
159 |
config: default
|
160 |
+
name: MTEB ArxivClusteringS2S
|
161 |
revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
|
162 |
split: test
|
163 |
type: mteb/arxiv-clustering-s2s
|
|
|
172 |
type: Clustering
|
173 |
- dataset:
|
174 |
config: default
|
175 |
+
name: MTEB AskUbuntuDupQuestions
|
176 |
revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
|
177 |
split: test
|
178 |
type: mteb/askubuntudupquestions-reranking
|
|
|
187 |
type: Reranking
|
188 |
- dataset:
|
189 |
config: default
|
190 |
+
name: MTEB BIOSSES
|
191 |
revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
|
192 |
split: test
|
193 |
type: mteb/biosses-sts
|
|
|
210 |
type: STS
|
211 |
- dataset:
|
212 |
config: default
|
213 |
+
name: MTEB Banking77Classification
|
214 |
revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
|
215 |
split: test
|
216 |
type: mteb/banking77
|
|
|
229 |
type: Classification
|
230 |
- dataset:
|
231 |
config: default
|
232 |
+
name: MTEB BiorxivClusteringP2P
|
233 |
revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
|
234 |
split: test
|
235 |
type: mteb/biorxiv-clustering-p2p
|
|
|
244 |
type: Clustering
|
245 |
- dataset:
|
246 |
config: default
|
247 |
+
name: MTEB BiorxivClusteringS2S
|
248 |
revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
|
249 |
split: test
|
250 |
type: mteb/biorxiv-clustering-s2s
|
|
|
259 |
type: Clustering
|
260 |
- dataset:
|
261 |
config: default
|
262 |
+
name: MTEB CQADupstackRetrieval
|
263 |
revision: 46989137a86843e03a6195de44b09deda022eec7
|
264 |
split: test
|
265 |
type: CQADupstackRetrieval_is_a_combined_dataset
|
|
|
330 |
type: Retrieval
|
331 |
- dataset:
|
332 |
config: default
|
333 |
+
name: MTEB ClimateFEVER
|
334 |
revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
|
335 |
split: test
|
336 |
type: mteb/climate-fever
|
|
|
401 |
type: Retrieval
|
402 |
- dataset:
|
403 |
config: default
|
404 |
+
name: MTEB DBPedia
|
405 |
revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
|
406 |
split: test
|
407 |
type: mteb/dbpedia
|
|
|
472 |
type: Retrieval
|
473 |
- dataset:
|
474 |
config: default
|
475 |
+
name: MTEB EmotionClassification
|
476 |
revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
|
477 |
split: test
|
478 |
type: mteb/emotion
|
|
|
491 |
type: Classification
|
492 |
- dataset:
|
493 |
config: default
|
494 |
+
name: MTEB FEVER
|
495 |
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
496 |
split: test
|
497 |
type: mteb/fever
|
|
|
562 |
type: Retrieval
|
563 |
- dataset:
|
564 |
config: default
|
565 |
+
name: MTEB FiQA2018
|
566 |
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
567 |
split: test
|
568 |
type: mteb/fiqa
|
|
|
633 |
type: Retrieval
|
634 |
- dataset:
|
635 |
config: default
|
636 |
+
name: MTEB HotpotQA
|
637 |
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
638 |
split: test
|
639 |
type: mteb/hotpotqa
|
|
|
704 |
type: Retrieval
|
705 |
- dataset:
|
706 |
config: default
|
707 |
+
name: MTEB ImdbClassification
|
708 |
revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
|
709 |
split: test
|
710 |
type: mteb/imdb
|
|
|
727 |
type: Classification
|
728 |
- dataset:
|
729 |
config: default
|
730 |
+
name: MTEB MSMARCO
|
731 |
revision: c5a29a104738b98a9e76336939199e264163d4a0
|
732 |
split: dev
|
733 |
type: mteb/msmarco
|
|
|
874 |
type: Classification
|
875 |
- dataset:
|
876 |
config: default
|
877 |
+
name: MTEB MedrxivClusteringP2P
|
878 |
revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
|
879 |
split: test
|
880 |
type: mteb/medrxiv-clustering-p2p
|
|
|
889 |
type: Clustering
|
890 |
- dataset:
|
891 |
config: default
|
892 |
+
name: MTEB MedrxivClusteringS2S
|
893 |
revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
|
894 |
split: test
|
895 |
type: mteb/medrxiv-clustering-s2s
|
|
|
904 |
type: Clustering
|
905 |
- dataset:
|
906 |
config: default
|
907 |
+
name: MTEB MindSmallReranking
|
908 |
revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
|
909 |
split: test
|
910 |
type: mteb/mind_small
|
|
|
919 |
type: Reranking
|
920 |
- dataset:
|
921 |
config: default
|
922 |
+
name: MTEB NFCorpus
|
923 |
revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
|
924 |
split: test
|
925 |
type: mteb/nfcorpus
|
|
|
990 |
type: Retrieval
|
991 |
- dataset:
|
992 |
config: default
|
993 |
+
name: MTEB NQ
|
994 |
revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
|
995 |
split: test
|
996 |
type: mteb/nq
|
|
|
1061 |
type: Retrieval
|
1062 |
- dataset:
|
1063 |
config: default
|
1064 |
+
name: MTEB QuoraRetrieval
|
1065 |
revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
|
1066 |
split: test
|
1067 |
type: mteb/quora
|
|
|
1132 |
type: Retrieval
|
1133 |
- dataset:
|
1134 |
config: default
|
1135 |
+
name: MTEB RedditClustering
|
1136 |
revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
|
1137 |
split: test
|
1138 |
type: mteb/reddit-clustering
|
|
|
1147 |
type: Clustering
|
1148 |
- dataset:
|
1149 |
config: default
|
1150 |
+
name: MTEB RedditClusteringP2P
|
1151 |
revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
|
1152 |
split: test
|
1153 |
type: mteb/reddit-clustering-p2p
|
|
|
1162 |
type: Clustering
|
1163 |
- dataset:
|
1164 |
config: default
|
1165 |
+
name: MTEB SCIDOCS
|
1166 |
revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
|
1167 |
split: test
|
1168 |
type: mteb/scidocs
|
|
|
1233 |
type: Retrieval
|
1234 |
- dataset:
|
1235 |
config: default
|
1236 |
+
name: MTEB SICK-R
|
1237 |
revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
|
1238 |
split: test
|
1239 |
type: mteb/sickr-sts
|
|
|
1256 |
type: STS
|
1257 |
- dataset:
|
1258 |
config: default
|
1259 |
+
name: MTEB STS12
|
1260 |
revision: a0d554a64d88156834ff5ae9920b964011b16384
|
1261 |
split: test
|
1262 |
type: mteb/sts12-sts
|
|
|
1279 |
type: STS
|
1280 |
- dataset:
|
1281 |
config: default
|
1282 |
+
name: MTEB STS13
|
1283 |
revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
|
1284 |
split: test
|
1285 |
type: mteb/sts13-sts
|
|
|
1302 |
type: STS
|
1303 |
- dataset:
|
1304 |
config: default
|
1305 |
+
name: MTEB STS14
|
1306 |
revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
|
1307 |
split: test
|
1308 |
type: mteb/sts14-sts
|
|
|
1325 |
type: STS
|
1326 |
- dataset:
|
1327 |
config: default
|
1328 |
+
name: MTEB STS15
|
1329 |
revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
|
1330 |
split: test
|
1331 |
type: mteb/sts15-sts
|
|
|
1348 |
type: STS
|
1349 |
- dataset:
|
1350 |
config: default
|
1351 |
+
name: MTEB STS16
|
1352 |
revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
|
1353 |
split: test
|
1354 |
type: mteb/sts16-sts
|
|
|
1417 |
type: STS
|
1418 |
- dataset:
|
1419 |
config: default
|
1420 |
+
name: MTEB STSBenchmark
|
1421 |
revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
|
1422 |
split: test
|
1423 |
type: mteb/stsbenchmark-sts
|
|
|
1440 |
type: STS
|
1441 |
- dataset:
|
1442 |
config: default
|
1443 |
+
name: MTEB SciDocsRR
|
1444 |
revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
|
1445 |
split: test
|
1446 |
type: mteb/scidocs-reranking
|
|
|
1455 |
type: Reranking
|
1456 |
- dataset:
|
1457 |
config: default
|
1458 |
+
name: MTEB SciFact
|
1459 |
revision: 0228b52cf27578f30900b9e5271d331663a030d7
|
1460 |
split: test
|
1461 |
type: mteb/scifact
|
|
|
1526 |
type: Retrieval
|
1527 |
- dataset:
|
1528 |
config: default
|
1529 |
+
name: MTEB SprintDuplicateQuestions
|
1530 |
revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
|
1531 |
split: test
|
1532 |
type: mteb/sprintduplicatequestions-pairclassification
|
|
|
1597 |
type: PairClassification
|
1598 |
- dataset:
|
1599 |
config: default
|
1600 |
+
name: MTEB StackExchangeClustering
|
1601 |
revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
|
1602 |
split: test
|
1603 |
type: mteb/stackexchange-clustering
|
|
|
1612 |
type: Clustering
|
1613 |
- dataset:
|
1614 |
config: default
|
1615 |
+
name: MTEB StackExchangeClusteringP2P
|
1616 |
revision: 815ca46b2622cec33ccafc3735d572c266efdb44
|
1617 |
split: test
|
1618 |
type: mteb/stackexchange-clustering-p2p
|
|
|
1627 |
type: Clustering
|
1628 |
- dataset:
|
1629 |
config: default
|
1630 |
+
name: MTEB StackOverflowDupQuestions
|
1631 |
revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
|
1632 |
split: test
|
1633 |
type: mteb/stackoverflowdupquestions-reranking
|
|
|
1642 |
type: Reranking
|
1643 |
- dataset:
|
1644 |
config: default
|
1645 |
+
name: MTEB SummEval
|
1646 |
revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
|
1647 |
split: test
|
1648 |
type: mteb/summeval
|
|
|
1661 |
type: Summarization
|
1662 |
- dataset:
|
1663 |
config: default
|
1664 |
+
name: MTEB TRECCOVID
|
1665 |
revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
|
1666 |
split: test
|
1667 |
type: mteb/trec-covid
|
|
|
1732 |
type: Retrieval
|
1733 |
- dataset:
|
1734 |
config: default
|
1735 |
+
name: MTEB Touche2020
|
1736 |
revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
|
1737 |
split: test
|
1738 |
type: mteb/touche2020
|
|
|
1803 |
type: Retrieval
|
1804 |
- dataset:
|
1805 |
config: default
|
1806 |
+
name: MTEB ToxicConversationsClassification
|
1807 |
revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
|
1808 |
split: test
|
1809 |
type: mteb/toxic_conversations_50k
|
|
|
1826 |
type: Classification
|
1827 |
- dataset:
|
1828 |
config: default
|
1829 |
+
name: MTEB TweetSentimentExtractionClassification
|
1830 |
revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
|
1831 |
split: test
|
1832 |
type: mteb/tweet_sentiment_extraction
|
|
|
1845 |
type: Classification
|
1846 |
- dataset:
|
1847 |
config: default
|
1848 |
+
name: MTEB TwentyNewsgroupsClustering
|
1849 |
revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
|
1850 |
split: test
|
1851 |
type: mteb/twentynewsgroups-clustering
|
|
|
1860 |
type: Clustering
|
1861 |
- dataset:
|
1862 |
config: default
|
1863 |
+
name: MTEB TwitterSemEval2015
|
1864 |
revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
|
1865 |
split: test
|
1866 |
type: mteb/twittersemeval2015-pairclassification
|
|
|
1931 |
type: PairClassification
|
1932 |
- dataset:
|
1933 |
config: default
|
1934 |
+
name: MTEB TwitterURLCorpus
|
1935 |
revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
|
1936 |
split: test
|
1937 |
type: mteb/twitterurlcorpus-pairclassification
|