Muennighoff committed on
Commit
79d71b4
1 Parent(s): 2f6b75f

Add revisions

Browse files
Files changed (1) hide show
  1. README.md +68 -0
README.md CHANGED
@@ -39,6 +39,7 @@ model-index:
39
  name: MTEB AmazonCounterfactualClassification (en)
40
  config: en
41
  split: test
 
42
  metrics:
43
  - type: accuracy
44
  value: 65.26865671641791
@@ -53,6 +54,7 @@ model-index:
53
  name: MTEB AmazonPolarityClassification
54
  config: default
55
  split: test
 
56
  metrics:
57
  - type: accuracy
58
  value: 67.13145
@@ -67,6 +69,7 @@ model-index:
67
  name: MTEB AmazonReviewsClassification (en)
68
  config: en
69
  split: test
 
70
  metrics:
71
  - type: accuracy
72
  value: 31.920000000000005
@@ -79,6 +82,7 @@ model-index:
79
  name: MTEB ArguAna
80
  config: default
81
  split: test
 
82
  metrics:
83
  - type: map_at_1
84
  value: 23.186
@@ -135,6 +139,7 @@ model-index:
135
  name: MTEB ArxivClusteringP2P
136
  config: default
137
  split: test
 
138
  metrics:
139
  - type: v_measure
140
  value: 48.37886340922374
@@ -145,6 +150,7 @@ model-index:
145
  name: MTEB ArxivClusteringS2S
146
  config: default
147
  split: test
 
148
  metrics:
149
  - type: v_measure
150
  value: 39.72488615315985
@@ -155,6 +161,7 @@ model-index:
155
  name: MTEB AskUbuntuDupQuestions
156
  config: default
157
  split: test
 
158
  metrics:
159
  - type: map
160
  value: 65.85199009344481
@@ -167,6 +174,7 @@ model-index:
167
  name: MTEB BIOSSES
168
  config: default
169
  split: test
 
170
  metrics:
171
  - type: cos_sim_pearson
172
  value: 84.47737119217858
@@ -187,6 +195,7 @@ model-index:
187
  name: MTEB Banking77Classification
188
  config: default
189
  split: test
 
190
  metrics:
191
  - type: accuracy
192
  value: 81.8603896103896
@@ -199,6 +208,7 @@ model-index:
199
  name: MTEB BiorxivClusteringP2P
200
  config: default
201
  split: test
 
202
  metrics:
203
  - type: v_measure
204
  value: 39.616605133625185
@@ -209,6 +219,7 @@ model-index:
209
  name: MTEB BiorxivClusteringS2S
210
  config: default
211
  split: test
 
212
  metrics:
213
  - type: v_measure
214
  value: 35.02442407186902
@@ -219,6 +230,7 @@ model-index:
219
  name: MTEB CQADupstackAndroidRetrieval
220
  config: default
221
  split: test
 
222
  metrics:
223
  - type: map_at_1
224
  value: 36.036
@@ -275,6 +287,7 @@ model-index:
275
  name: MTEB CQADupstackEnglishRetrieval
276
  config: default
277
  split: test
 
278
  metrics:
279
  - type: map_at_1
280
  value: 32.92
@@ -331,6 +344,7 @@ model-index:
331
  name: MTEB CQADupstackGamingRetrieval
332
  config: default
333
  split: test
 
334
  metrics:
335
  - type: map_at_1
336
  value: 40.695
@@ -387,6 +401,7 @@ model-index:
387
  name: MTEB CQADupstackGisRetrieval
388
  config: default
389
  split: test
 
390
  metrics:
391
  - type: map_at_1
392
  value: 29.024
@@ -443,6 +458,7 @@ model-index:
443
  name: MTEB CQADupstackMathematicaRetrieval
444
  config: default
445
  split: test
 
446
  metrics:
447
  - type: map_at_1
448
  value: 17.774
@@ -499,6 +515,7 @@ model-index:
499
  name: MTEB CQADupstackPhysicsRetrieval
500
  config: default
501
  split: test
 
502
  metrics:
503
  - type: map_at_1
504
  value: 31.885
@@ -555,6 +572,7 @@ model-index:
555
  name: MTEB CQADupstackProgrammersRetrieval
556
  config: default
557
  split: test
 
558
  metrics:
559
  - type: map_at_1
560
  value: 26.454
@@ -611,6 +629,7 @@ model-index:
611
  name: MTEB CQADupstackRetrieval
612
  config: default
613
  split: test
 
614
  metrics:
615
  - type: map_at_1
616
  value: 27.743666666666666
@@ -667,6 +686,7 @@ model-index:
667
  name: MTEB CQADupstackStatsRetrieval
668
  config: default
669
  split: test
 
670
  metrics:
671
  - type: map_at_1
672
  value: 25.244
@@ -723,6 +743,7 @@ model-index:
723
  name: MTEB CQADupstackTexRetrieval
724
  config: default
725
  split: test
 
726
  metrics:
727
  - type: map_at_1
728
  value: 18.857
@@ -779,6 +800,7 @@ model-index:
779
  name: MTEB CQADupstackUnixRetrieval
780
  config: default
781
  split: test
 
782
  metrics:
783
  - type: map_at_1
784
  value: 27.486
@@ -835,6 +857,7 @@ model-index:
835
  name: MTEB CQADupstackWebmastersRetrieval
836
  config: default
837
  split: test
 
838
  metrics:
839
  - type: map_at_1
840
  value: 26.207
@@ -891,6 +914,7 @@ model-index:
891
  name: MTEB CQADupstackWordpressRetrieval
892
  config: default
893
  split: test
 
894
  metrics:
895
  - type: map_at_1
896
  value: 20.342
@@ -947,6 +971,7 @@ model-index:
947
  name: MTEB ClimateFEVER
948
  config: default
949
  split: test
 
950
  metrics:
951
  - type: map_at_1
952
  value: 7.71
@@ -1003,6 +1028,7 @@ model-index:
1003
  name: MTEB DBPedia
1004
  config: default
1005
  split: test
 
1006
  metrics:
1007
  - type: map_at_1
1008
  value: 6.8180000000000005
@@ -1059,6 +1085,7 @@ model-index:
1059
  name: MTEB EmotionClassification
1060
  config: default
1061
  split: test
 
1062
  metrics:
1063
  - type: accuracy
1064
  value: 39.725
@@ -1071,6 +1098,7 @@ model-index:
1071
  name: MTEB FEVER
1072
  config: default
1073
  split: test
 
1074
  metrics:
1075
  - type: map_at_1
1076
  value: 31.901000000000003
@@ -1127,6 +1155,7 @@ model-index:
1127
  name: MTEB FiQA2018
1128
  config: default
1129
  split: test
 
1130
  metrics:
1131
  - type: map_at_1
1132
  value: 24.4
@@ -1183,6 +1212,7 @@ model-index:
1183
  name: MTEB HotpotQA
1184
  config: default
1185
  split: test
 
1186
  metrics:
1187
  - type: map_at_1
1188
  value: 22.262
@@ -1239,6 +1269,7 @@ model-index:
1239
  name: MTEB ImdbClassification
1240
  config: default
1241
  split: test
 
1242
  metrics:
1243
  - type: accuracy
1244
  value: 70.7156
@@ -1253,6 +1284,7 @@ model-index:
1253
  name: MTEB MSMARCO
1254
  config: default
1255
  split: dev
 
1256
  metrics:
1257
  - type: map_at_1
1258
  value: 21.174
@@ -1309,6 +1341,7 @@ model-index:
1309
  name: MTEB MTOPDomainClassification (en)
1310
  config: en
1311
  split: test
 
1312
  metrics:
1313
  - type: accuracy
1314
  value: 92.07934336525308
@@ -1321,6 +1354,7 @@ model-index:
1321
  name: MTEB MTOPIntentClassification (en)
1322
  config: en
1323
  split: test
 
1324
  metrics:
1325
  - type: accuracy
1326
  value: 70.20975832193344
@@ -1333,6 +1367,7 @@ model-index:
1333
  name: MTEB MassiveIntentClassification (en)
1334
  config: en
1335
  split: test
 
1336
  metrics:
1337
  - type: accuracy
1338
  value: 69.56624075319435
@@ -1345,6 +1380,7 @@ model-index:
1345
  name: MTEB MassiveScenarioClassification (en)
1346
  config: en
1347
  split: test
 
1348
  metrics:
1349
  - type: accuracy
1350
  value: 76.01210490921318
@@ -1357,6 +1393,7 @@ model-index:
1357
  name: MTEB MedrxivClusteringP2P
1358
  config: default
1359
  split: test
 
1360
  metrics:
1361
  - type: v_measure
1362
  value: 35.58002813186373
@@ -1367,6 +1404,7 @@ model-index:
1367
  name: MTEB MedrxivClusteringS2S
1368
  config: default
1369
  split: test
 
1370
  metrics:
1371
  - type: v_measure
1372
  value: 32.872725562410444
@@ -1377,6 +1415,7 @@ model-index:
1377
  name: MTEB MindSmallReranking
1378
  config: default
1379
  split: test
 
1380
  metrics:
1381
  - type: map
1382
  value: 30.965343604861328
@@ -1389,6 +1428,7 @@ model-index:
1389
  name: MTEB NFCorpus
1390
  config: default
1391
  split: test
 
1392
  metrics:
1393
  - type: map_at_1
1394
  value: 4.938
@@ -1445,6 +1485,7 @@ model-index:
1445
  name: MTEB NQ
1446
  config: default
1447
  split: test
 
1448
  metrics:
1449
  - type: map_at_1
1450
  value: 27.124
@@ -1501,6 +1542,7 @@ model-index:
1501
  name: MTEB QuoraRetrieval
1502
  config: default
1503
  split: test
 
1504
  metrics:
1505
  - type: map_at_1
1506
  value: 69.33500000000001
@@ -1557,6 +1599,7 @@ model-index:
1557
  name: MTEB RedditClustering
1558
  config: default
1559
  split: test
 
1560
  metrics:
1561
  - type: v_measure
1562
  value: 54.824256698437324
@@ -1567,6 +1610,7 @@ model-index:
1567
  name: MTEB RedditClusteringP2P
1568
  config: default
1569
  split: test
 
1570
  metrics:
1571
  - type: v_measure
1572
  value: 56.768972678049366
@@ -1577,6 +1621,7 @@ model-index:
1577
  name: MTEB SCIDOCS
1578
  config: default
1579
  split: test
 
1580
  metrics:
1581
  - type: map_at_1
1582
  value: 5.192
@@ -1633,6 +1678,7 @@ model-index:
1633
  name: MTEB SICK-R
1634
  config: default
1635
  split: test
 
1636
  metrics:
1637
  - type: cos_sim_pearson
1638
  value: 84.00280838354293
@@ -1653,6 +1699,7 @@ model-index:
1653
  name: MTEB STS12
1654
  config: default
1655
  split: test
 
1656
  metrics:
1657
  - type: cos_sim_pearson
1658
  value: 83.2801353818369
@@ -1673,6 +1720,7 @@ model-index:
1673
  name: MTEB STS13
1674
  config: default
1675
  split: test
 
1676
  metrics:
1677
  - type: cos_sim_pearson
1678
  value: 83.20700572036095
@@ -1693,6 +1741,7 @@ model-index:
1693
  name: MTEB STS14
1694
  config: default
1695
  split: test
 
1696
  metrics:
1697
  - type: cos_sim_pearson
1698
  value: 82.27113025749529
@@ -1713,6 +1762,7 @@ model-index:
1713
  name: MTEB STS15
1714
  config: default
1715
  split: test
 
1716
  metrics:
1717
  - type: cos_sim_pearson
1718
  value: 84.98824030948605
@@ -1733,6 +1783,7 @@ model-index:
1733
  name: MTEB STS16
1734
  config: default
1735
  split: test
 
1736
  metrics:
1737
  - type: cos_sim_pearson
1738
  value: 78.82478639193744
@@ -1753,6 +1804,7 @@ model-index:
1753
  name: MTEB STS17 (en-en)
1754
  config: en-en
1755
  split: test
 
1756
  metrics:
1757
  - type: cos_sim_pearson
1758
  value: 90.90804154377126
@@ -1773,6 +1825,7 @@ model-index:
1773
  name: MTEB STS22 (en)
1774
  config: en
1775
  split: test
 
1776
  metrics:
1777
  - type: cos_sim_pearson
1778
  value: 66.78771571400975
@@ -1793,6 +1846,7 @@ model-index:
1793
  name: MTEB STSBenchmark
1794
  config: default
1795
  split: test
 
1796
  metrics:
1797
  - type: cos_sim_pearson
1798
  value: 84.03996099800993
@@ -1813,6 +1867,7 @@ model-index:
1813
  name: MTEB SciDocsRR
1814
  config: default
1815
  split: test
 
1816
  metrics:
1817
  - type: map
1818
  value: 88.65396986895777
@@ -1825,6 +1880,7 @@ model-index:
1825
  name: MTEB SciFact
1826
  config: default
1827
  split: test
 
1828
  metrics:
1829
  - type: map_at_1
1830
  value: 51.456
@@ -1881,6 +1937,7 @@ model-index:
1881
  name: MTEB SprintDuplicateQuestions
1882
  config: default
1883
  split: test
 
1884
  metrics:
1885
  - type: cos_sim_accuracy
1886
  value: 99.65940594059406
@@ -1935,6 +1992,7 @@ model-index:
1935
  name: MTEB StackExchangeClustering
1936
  config: default
1937
  split: test
 
1938
  metrics:
1939
  - type: v_measure
1940
  value: 53.80048409076929
@@ -1945,6 +2003,7 @@ model-index:
1945
  name: MTEB StackExchangeClusteringP2P
1946
  config: default
1947
  split: test
 
1948
  metrics:
1949
  - type: v_measure
1950
  value: 34.280269334397545
@@ -1955,6 +2014,7 @@ model-index:
1955
  name: MTEB StackOverflowDupQuestions
1956
  config: default
1957
  split: test
 
1958
  metrics:
1959
  - type: map
1960
  value: 51.97907654945493
@@ -1967,6 +2027,7 @@ model-index:
1967
  name: MTEB SummEval
1968
  config: default
1969
  split: test
 
1970
  metrics:
1971
  - type: cos_sim_pearson
1972
  value: 28.364293841556304
@@ -1983,6 +2044,7 @@ model-index:
1983
  name: MTEB TRECCOVID
1984
  config: default
1985
  split: test
 
1986
  metrics:
1987
  - type: map_at_1
1988
  value: 0.19499999999999998
@@ -2039,6 +2101,7 @@ model-index:
2039
  name: MTEB Touche2020
2040
  config: default
2041
  split: test
 
2042
  metrics:
2043
  - type: map_at_1
2044
  value: 1.997
@@ -2095,6 +2158,7 @@ model-index:
2095
  name: MTEB ToxicConversationsClassification
2096
  config: default
2097
  split: test
 
2098
  metrics:
2099
  - type: accuracy
2100
  value: 60.861200000000004
@@ -2109,6 +2173,7 @@ model-index:
2109
  name: MTEB TweetSentimentExtractionClassification
2110
  config: default
2111
  split: test
 
2112
  metrics:
2113
  - type: accuracy
2114
  value: 55.464063384267114
@@ -2121,6 +2186,7 @@ model-index:
2121
  name: MTEB TwentyNewsgroupsClustering
2122
  config: default
2123
  split: test
 
2124
  metrics:
2125
  - type: v_measure
2126
  value: 49.74455348083809
@@ -2131,6 +2197,7 @@ model-index:
2131
  name: MTEB TwitterSemEval2015
2132
  config: default
2133
  split: test
 
2134
  metrics:
2135
  - type: cos_sim_accuracy
2136
  value: 86.07617571675507
@@ -2185,6 +2252,7 @@ model-index:
2185
  name: MTEB TwitterURLCorpus
2186
  config: default
2187
  split: test
 
2188
  metrics:
2189
  - type: cos_sim_accuracy
2190
  value: 88.51631932316529
 
39
  name: MTEB AmazonCounterfactualClassification (en)
40
  config: en
41
  split: test
42
+ revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
43
  metrics:
44
  - type: accuracy
45
  value: 65.26865671641791
 
54
  name: MTEB AmazonPolarityClassification
55
  config: default
56
  split: test
57
+ revision: 80714f8dcf8cefc218ef4f8c5a966dd83f75a0e1
58
  metrics:
59
  - type: accuracy
60
  value: 67.13145
 
69
  name: MTEB AmazonReviewsClassification (en)
70
  config: en
71
  split: test
72
+ revision: c379a6705fec24a2493fa68e011692605f44e119
73
  metrics:
74
  - type: accuracy
75
  value: 31.920000000000005
 
82
  name: MTEB ArguAna
83
  config: default
84
  split: test
85
+ revision: 5b3e3697907184a9b77a3c99ee9ea1a9cbb1e4e3
86
  metrics:
87
  - type: map_at_1
88
  value: 23.186
 
139
  name: MTEB ArxivClusteringP2P
140
  config: default
141
  split: test
142
+ revision: 0bbdb47bcbe3a90093699aefeed338a0f28a7ee8
143
  metrics:
144
  - type: v_measure
145
  value: 48.37886340922374
 
150
  name: MTEB ArxivClusteringS2S
151
  config: default
152
  split: test
153
+ revision: b73bd54100e5abfa6e3a23dcafb46fe4d2438dc3
154
  metrics:
155
  - type: v_measure
156
  value: 39.72488615315985
 
161
  name: MTEB AskUbuntuDupQuestions
162
  config: default
163
  split: test
164
+ revision: 4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c
165
  metrics:
166
  - type: map
167
  value: 65.85199009344481
 
174
  name: MTEB BIOSSES
175
  config: default
176
  split: test
177
+ revision: 9ee918f184421b6bd48b78f6c714d86546106103
178
  metrics:
179
  - type: cos_sim_pearson
180
  value: 84.47737119217858
 
195
  name: MTEB Banking77Classification
196
  config: default
197
  split: test
198
+ revision: 44fa15921b4c889113cc5df03dd4901b49161ab7
199
  metrics:
200
  - type: accuracy
201
  value: 81.8603896103896
 
208
  name: MTEB BiorxivClusteringP2P
209
  config: default
210
  split: test
211
+ revision: 11d0121201d1f1f280e8cc8f3d98fb9c4d9f9c55
212
  metrics:
213
  - type: v_measure
214
  value: 39.616605133625185
 
219
  name: MTEB BiorxivClusteringS2S
220
  config: default
221
  split: test
222
+ revision: c0fab014e1bcb8d3a5e31b2088972a1e01547dc1
223
  metrics:
224
  - type: v_measure
225
  value: 35.02442407186902
 
230
  name: MTEB CQADupstackAndroidRetrieval
231
  config: default
232
  split: test
233
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
234
  metrics:
235
  - type: map_at_1
236
  value: 36.036
 
287
  name: MTEB CQADupstackEnglishRetrieval
288
  config: default
289
  split: test
290
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
291
  metrics:
292
  - type: map_at_1
293
  value: 32.92
 
344
  name: MTEB CQADupstackGamingRetrieval
345
  config: default
346
  split: test
347
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
348
  metrics:
349
  - type: map_at_1
350
  value: 40.695
 
401
  name: MTEB CQADupstackGisRetrieval
402
  config: default
403
  split: test
404
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
405
  metrics:
406
  - type: map_at_1
407
  value: 29.024
 
458
  name: MTEB CQADupstackMathematicaRetrieval
459
  config: default
460
  split: test
461
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
462
  metrics:
463
  - type: map_at_1
464
  value: 17.774
 
515
  name: MTEB CQADupstackPhysicsRetrieval
516
  config: default
517
  split: test
518
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
519
  metrics:
520
  - type: map_at_1
521
  value: 31.885
 
572
  name: MTEB CQADupstackProgrammersRetrieval
573
  config: default
574
  split: test
575
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
576
  metrics:
577
  - type: map_at_1
578
  value: 26.454
 
629
  name: MTEB CQADupstackRetrieval
630
  config: default
631
  split: test
632
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
633
  metrics:
634
  - type: map_at_1
635
  value: 27.743666666666666
 
686
  name: MTEB CQADupstackStatsRetrieval
687
  config: default
688
  split: test
689
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
690
  metrics:
691
  - type: map_at_1
692
  value: 25.244
 
743
  name: MTEB CQADupstackTexRetrieval
744
  config: default
745
  split: test
746
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
747
  metrics:
748
  - type: map_at_1
749
  value: 18.857
 
800
  name: MTEB CQADupstackUnixRetrieval
801
  config: default
802
  split: test
803
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
804
  metrics:
805
  - type: map_at_1
806
  value: 27.486
 
857
  name: MTEB CQADupstackWebmastersRetrieval
858
  config: default
859
  split: test
860
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
861
  metrics:
862
  - type: map_at_1
863
  value: 26.207
 
914
  name: MTEB CQADupstackWordpressRetrieval
915
  config: default
916
  split: test
917
+ revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
918
  metrics:
919
  - type: map_at_1
920
  value: 20.342
 
971
  name: MTEB ClimateFEVER
972
  config: default
973
  split: test
974
+ revision: 392b78eb68c07badcd7c2cd8f39af108375dfcce
975
  metrics:
976
  - type: map_at_1
977
  value: 7.71
 
1028
  name: MTEB DBPedia
1029
  config: default
1030
  split: test
1031
+ revision: f097057d03ed98220bc7309ddb10b71a54d667d6
1032
  metrics:
1033
  - type: map_at_1
1034
  value: 6.8180000000000005
 
1085
  name: MTEB EmotionClassification
1086
  config: default
1087
  split: test
1088
+ revision: 829147f8f75a25f005913200eb5ed41fae320aa1
1089
  metrics:
1090
  - type: accuracy
1091
  value: 39.725
 
1098
  name: MTEB FEVER
1099
  config: default
1100
  split: test
1101
+ revision: 1429cf27e393599b8b359b9b72c666f96b2525f9
1102
  metrics:
1103
  - type: map_at_1
1104
  value: 31.901000000000003
 
1155
  name: MTEB FiQA2018
1156
  config: default
1157
  split: test
1158
+ revision: 41b686a7f28c59bcaaa5791efd47c67c8ebe28be
1159
  metrics:
1160
  - type: map_at_1
1161
  value: 24.4
 
1212
  name: MTEB HotpotQA
1213
  config: default
1214
  split: test
1215
+ revision: 766870b35a1b9ca65e67a0d1913899973551fc6c
1216
  metrics:
1217
  - type: map_at_1
1218
  value: 22.262
 
1269
  name: MTEB ImdbClassification
1270
  config: default
1271
  split: test
1272
+ revision: 8d743909f834c38949e8323a8a6ce8721ea6c7f4
1273
  metrics:
1274
  - type: accuracy
1275
  value: 70.7156
 
1284
  name: MTEB MSMARCO
1285
  config: default
1286
  split: dev
1287
+ revision: e6838a846e2408f22cf5cc337ebc83e0bcf77849
1288
  metrics:
1289
  - type: map_at_1
1290
  value: 21.174
 
1341
  name: MTEB MTOPDomainClassification (en)
1342
  config: en
1343
  split: test
1344
+ revision: a7e2a951126a26fc8c6a69f835f33a346ba259e3
1345
  metrics:
1346
  - type: accuracy
1347
  value: 92.07934336525308
 
1354
  name: MTEB MTOPIntentClassification (en)
1355
  config: en
1356
  split: test
1357
+ revision: 6299947a7777084cc2d4b64235bf7190381ce755
1358
  metrics:
1359
  - type: accuracy
1360
  value: 70.20975832193344
 
1367
  name: MTEB MassiveIntentClassification (en)
1368
  config: en
1369
  split: test
1370
+ revision: 072a486a144adf7f4479a4a0dddb2152e161e1ea
1371
  metrics:
1372
  - type: accuracy
1373
  value: 69.56624075319435
 
1380
  name: MTEB MassiveScenarioClassification (en)
1381
  config: en
1382
  split: test
1383
+ revision: 7d571f92784cd94a019292a1f45445077d0ef634
1384
  metrics:
1385
  - type: accuracy
1386
  value: 76.01210490921318
 
1393
  name: MTEB MedrxivClusteringP2P
1394
  config: default
1395
  split: test
1396
+ revision: dcefc037ef84348e49b0d29109e891c01067226b
1397
  metrics:
1398
  - type: v_measure
1399
  value: 35.58002813186373
 
1404
  name: MTEB MedrxivClusteringS2S
1405
  config: default
1406
  split: test
1407
+ revision: 3cd0e71dfbe09d4de0f9e5ecba43e7ce280959dc
1408
  metrics:
1409
  - type: v_measure
1410
  value: 32.872725562410444
 
1415
  name: MTEB MindSmallReranking
1416
  config: default
1417
  split: test
1418
+ revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
1419
  metrics:
1420
  - type: map
1421
  value: 30.965343604861328
 
1428
  name: MTEB NFCorpus
1429
  config: default
1430
  split: test
1431
+ revision: 7eb63cc0c1eb59324d709ebed25fcab851fa7610
1432
  metrics:
1433
  - type: map_at_1
1434
  value: 4.938
 
1485
  name: MTEB NQ
1486
  config: default
1487
  split: test
1488
+ revision: 6062aefc120bfe8ece5897809fb2e53bfe0d128c
1489
  metrics:
1490
  - type: map_at_1
1491
  value: 27.124
 
1542
  name: MTEB QuoraRetrieval
1543
  config: default
1544
  split: test
1545
+ revision: 6205996560df11e3a3da9ab4f926788fc30a7db4
1546
  metrics:
1547
  - type: map_at_1
1548
  value: 69.33500000000001
 
1599
  name: MTEB RedditClustering
1600
  config: default
1601
  split: test
1602
+ revision: b2805658ae38990172679479369a78b86de8c390
1603
  metrics:
1604
  - type: v_measure
1605
  value: 54.824256698437324
 
1610
  name: MTEB RedditClusteringP2P
1611
  config: default
1612
  split: test
1613
+ revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
1614
  metrics:
1615
  - type: v_measure
1616
  value: 56.768972678049366
 
1621
  name: MTEB SCIDOCS
1622
  config: default
1623
  split: test
1624
+ revision: 5c59ef3e437a0a9651c8fe6fde943e7dce59fba5
1625
  metrics:
1626
  - type: map_at_1
1627
  value: 5.192
 
1678
  name: MTEB SICK-R
1679
  config: default
1680
  split: test
1681
+ revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
1682
  metrics:
1683
  - type: cos_sim_pearson
1684
  value: 84.00280838354293
 
1699
  name: MTEB STS12
1700
  config: default
1701
  split: test
1702
+ revision: fdf84275bb8ce4b49c971d02e84dd1abc677a50f
1703
  metrics:
1704
  - type: cos_sim_pearson
1705
  value: 83.2801353818369
 
1720
  name: MTEB STS13
1721
  config: default
1722
  split: test
1723
+ revision: 1591bfcbe8c69d4bf7fe2a16e2451017832cafb9
1724
  metrics:
1725
  - type: cos_sim_pearson
1726
  value: 83.20700572036095
 
1741
  name: MTEB STS14
1742
  config: default
1743
  split: test
1744
+ revision: e2125984e7df8b7871f6ae9949cf6b6795e7c54b
1745
  metrics:
1746
  - type: cos_sim_pearson
1747
  value: 82.27113025749529
 
1762
  name: MTEB STS15
1763
  config: default
1764
  split: test
1765
+ revision: 1cd7298cac12a96a373b6a2f18738bb3e739a9b6
1766
  metrics:
1767
  - type: cos_sim_pearson
1768
  value: 84.98824030948605
 
1783
  name: MTEB STS16
1784
  config: default
1785
  split: test
1786
+ revision: 360a0b2dff98700d09e634a01e1cc1624d3e42cd
1787
  metrics:
1788
  - type: cos_sim_pearson
1789
  value: 78.82478639193744
 
1804
  name: MTEB STS17 (en-en)
1805
  config: en-en
1806
  split: test
1807
+ revision: 9fc37e8c632af1c87a3d23e685d49552a02582a0
1808
  metrics:
1809
  - type: cos_sim_pearson
1810
  value: 90.90804154377126
 
1825
  name: MTEB STS22 (en)
1826
  config: en
1827
  split: test
1828
+ revision: 2de6ce8c1921b71a755b262c6b57fef195dd7906
1829
  metrics:
1830
  - type: cos_sim_pearson
1831
  value: 66.78771571400975
 
1846
  name: MTEB STSBenchmark
1847
  config: default
1848
  split: test
1849
+ revision: 8913289635987208e6e7c72789e4be2fe94b6abd
1850
  metrics:
1851
  - type: cos_sim_pearson
1852
  value: 84.03996099800993
 
1867
  name: MTEB SciDocsRR
1868
  config: default
1869
  split: test
1870
+ revision: 56a6d0140cf6356659e2a7c1413286a774468d44
1871
  metrics:
1872
  - type: map
1873
  value: 88.65396986895777
 
1880
  name: MTEB SciFact
1881
  config: default
1882
  split: test
1883
+ revision: a75ae049398addde9b70f6b268875f5cbce99089
1884
  metrics:
1885
  - type: map_at_1
1886
  value: 51.456
 
1937
  name: MTEB SprintDuplicateQuestions
1938
  config: default
1939
  split: test
1940
+ revision: 5a8256d0dff9c4bd3be3ba3e67e4e70173f802ea
1941
  metrics:
1942
  - type: cos_sim_accuracy
1943
  value: 99.65940594059406
 
1992
  name: MTEB StackExchangeClustering
1993
  config: default
1994
  split: test
1995
+ revision: 70a89468f6dccacc6aa2b12a6eac54e74328f235
1996
  metrics:
1997
  - type: v_measure
1998
  value: 53.80048409076929
 
2003
  name: MTEB StackExchangeClusteringP2P
2004
  config: default
2005
  split: test
2006
+ revision: d88009ab563dd0b16cfaf4436abaf97fa3550cf0
2007
  metrics:
2008
  - type: v_measure
2009
  value: 34.280269334397545
 
2014
  name: MTEB StackOverflowDupQuestions
2015
  config: default
2016
  split: test
2017
+ revision: ef807ea29a75ec4f91b50fd4191cb4ee4589a9f9
2018
  metrics:
2019
  - type: map
2020
  value: 51.97907654945493
 
2027
  name: MTEB SummEval
2028
  config: default
2029
  split: test
2030
+ revision: 8753c2788d36c01fc6f05d03fe3f7268d63f9122
2031
  metrics:
2032
  - type: cos_sim_pearson
2033
  value: 28.364293841556304
 
2044
  name: MTEB TRECCOVID
2045
  config: default
2046
  split: test
2047
+ revision: 2c8041b2c07a79b6f7ba8fe6acc72e5d9f92d217
2048
  metrics:
2049
  - type: map_at_1
2050
  value: 0.19499999999999998
 
2101
  name: MTEB Touche2020
2102
  config: default
2103
  split: test
2104
+ revision: 527b7d77e16e343303e68cb6af11d6e18b9f7b3b
2105
  metrics:
2106
  - type: map_at_1
2107
  value: 1.997
 
2158
  name: MTEB ToxicConversationsClassification
2159
  config: default
2160
  split: test
2161
+ revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
2162
  metrics:
2163
  - type: accuracy
2164
  value: 60.861200000000004
 
2173
  name: MTEB TweetSentimentExtractionClassification
2174
  config: default
2175
  split: test
2176
+ revision: 62146448f05be9e52a36b8ee9936447ea787eede
2177
  metrics:
2178
  - type: accuracy
2179
  value: 55.464063384267114
 
2186
  name: MTEB TwentyNewsgroupsClustering
2187
  config: default
2188
  split: test
2189
+ revision: 091a54f9a36281ce7d6590ec8c75dd485e7e01d4
2190
  metrics:
2191
  - type: v_measure
2192
  value: 49.74455348083809
 
2197
  name: MTEB TwitterSemEval2015
2198
  config: default
2199
  split: test
2200
+ revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
2201
  metrics:
2202
  - type: cos_sim_accuracy
2203
  value: 86.07617571675507
 
2252
  name: MTEB TwitterURLCorpus
2253
  config: default
2254
  split: test
2255
+ revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
2256
  metrics:
2257
  - type: cos_sim_accuracy
2258
  value: 88.51631932316529