matyaydin committed on
Commit
9914bff
·
verified ·
1 Parent(s): cd33264

Upload tokenizer

Browse files
Files changed (1) hide show
  1. README.md +59 -167
README.md CHANGED
@@ -5,14 +5,17 @@ tags:
5
  - sentence-similarity
6
  - transformers
7
  - mteb
 
 
 
8
  model-index:
9
  - name: bge-base-en-v1.5
10
  results:
11
  - task:
12
  type: Classification
13
  dataset:
14
- type: mteb/amazon_counterfactual
15
  name: MTEB AmazonCounterfactualClassification (en)
 
16
  config: en
17
  split: test
18
  revision: e8379541af4e31359cca9fbcf4b00f2671dba205
@@ -26,8 +29,8 @@ model-index:
26
  - task:
27
  type: Classification
28
  dataset:
29
- type: mteb/amazon_polarity
30
  name: MTEB AmazonPolarityClassification
 
31
  config: default
32
  split: test
33
  revision: e2d317d38cd51312af73b3d32a06d1a08b442046
@@ -41,8 +44,8 @@ model-index:
41
  - task:
42
  type: Classification
43
  dataset:
44
- type: mteb/amazon_reviews_multi
45
  name: MTEB AmazonReviewsClassification (en)
 
46
  config: en
47
  split: test
48
  revision: 1399c76144fd37290681b995c656ef9b2e06e26d
@@ -54,8 +57,8 @@ model-index:
54
  - task:
55
  type: Retrieval
56
  dataset:
57
- type: arguana
58
  name: MTEB ArguAna
 
59
  config: default
60
  split: test
61
  revision: None
@@ -123,8 +126,8 @@ model-index:
123
  - task:
124
  type: Clustering
125
  dataset:
126
- type: mteb/arxiv-clustering-p2p
127
  name: MTEB ArxivClusteringP2P
 
128
  config: default
129
  split: test
130
  revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
@@ -134,8 +137,8 @@ model-index:
134
  - task:
135
  type: Clustering
136
  dataset:
137
- type: mteb/arxiv-clustering-s2s
138
  name: MTEB ArxivClusteringS2S
 
139
  config: default
140
  split: test
141
  revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
@@ -145,8 +148,8 @@ model-index:
145
  - task:
146
  type: Reranking
147
  dataset:
148
- type: mteb/askubuntudupquestions-reranking
149
  name: MTEB AskUbuntuDupQuestions
 
150
  config: default
151
  split: test
152
  revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
@@ -158,8 +161,8 @@ model-index:
158
  - task:
159
  type: STS
160
  dataset:
161
- type: mteb/biosses-sts
162
  name: MTEB BIOSSES
 
163
  config: default
164
  split: test
165
  revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
@@ -179,8 +182,8 @@ model-index:
179
  - task:
180
  type: Classification
181
  dataset:
182
- type: mteb/banking77
183
  name: MTEB Banking77Classification
 
184
  config: default
185
  split: test
186
  revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
@@ -192,8 +195,8 @@ model-index:
192
  - task:
193
  type: Clustering
194
  dataset:
195
- type: mteb/biorxiv-clustering-p2p
196
  name: MTEB BiorxivClusteringP2P
 
197
  config: default
198
  split: test
199
  revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
@@ -203,8 +206,8 @@ model-index:
203
  - task:
204
  type: Clustering
205
  dataset:
206
- type: mteb/biorxiv-clustering-s2s
207
  name: MTEB BiorxivClusteringS2S
 
208
  config: default
209
  split: test
210
  revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
@@ -214,8 +217,8 @@ model-index:
214
  - task:
215
  type: Retrieval
216
  dataset:
217
- type: BeIR/cqadupstack
218
  name: MTEB CQADupstackAndroidRetrieval
 
219
  config: default
220
  split: test
221
  revision: None
@@ -280,15 +283,6 @@ model-index:
280
  value: 48.065000000000005
281
  - type: recall_at_5
282
  value: 54.519
283
- - task:
284
- type: Retrieval
285
- dataset:
286
- type: BeIR/cqadupstack
287
- name: MTEB CQADupstackEnglishRetrieval
288
- config: default
289
- split: test
290
- revision: None
291
- metrics:
292
  - type: map_at_1
293
  value: 32.671
294
  - type: map_at_10
@@ -349,15 +343,6 @@ model-index:
349
  value: 45.626
350
  - type: recall_at_5
351
  value: 51.812000000000005
352
- - task:
353
- type: Retrieval
354
- dataset:
355
- type: BeIR/cqadupstack
356
- name: MTEB CQADupstackGamingRetrieval
357
- config: default
358
- split: test
359
- revision: None
360
- metrics:
361
  - type: map_at_1
362
  value: 41.185
363
  - type: map_at_10
@@ -418,15 +403,6 @@ model-index:
418
  value: 59.199999999999996
419
  - type: recall_at_5
420
  value: 66.118
421
- - task:
422
- type: Retrieval
423
- dataset:
424
- type: BeIR/cqadupstack
425
- name: MTEB CQADupstackGisRetrieval
426
- config: default
427
- split: test
428
- revision: None
429
- metrics:
430
  - type: map_at_1
431
  value: 27.27
432
  - type: map_at_10
@@ -487,15 +463,6 @@ model-index:
487
  value: 40.974
488
  - type: recall_at_5
489
  value: 47.327000000000005
490
- - task:
491
- type: Retrieval
492
- dataset:
493
- type: BeIR/cqadupstack
494
- name: MTEB CQADupstackMathematicaRetrieval
495
- config: default
496
- split: test
497
- revision: None
498
- metrics:
499
  - type: map_at_1
500
  value: 17.848
501
  - type: map_at_10
@@ -556,15 +523,6 @@ model-index:
556
  value: 29.18
557
  - type: recall_at_5
558
  value: 35.347
559
- - task:
560
- type: Retrieval
561
- dataset:
562
- type: BeIR/cqadupstack
563
- name: MTEB CQADupstackPhysicsRetrieval
564
- config: default
565
- split: test
566
- revision: None
567
- metrics:
568
  - type: map_at_1
569
  value: 30.94
570
  - type: map_at_10
@@ -625,15 +583,6 @@ model-index:
625
  value: 44.712
626
  - type: recall_at_5
627
  value: 51.932
628
- - task:
629
- type: Retrieval
630
- dataset:
631
- type: BeIR/cqadupstack
632
- name: MTEB CQADupstackProgrammersRetrieval
633
- config: default
634
- split: test
635
- revision: None
636
- metrics:
637
  - type: map_at_1
638
  value: 27.104
639
  - type: map_at_10
@@ -694,15 +643,6 @@ model-index:
694
  value: 39.92
695
  - type: recall_at_5
696
  value: 45.457
697
- - task:
698
- type: Retrieval
699
- dataset:
700
- type: BeIR/cqadupstack
701
- name: MTEB CQADupstackRetrieval
702
- config: default
703
- split: test
704
- revision: None
705
- metrics:
706
  - type: map_at_1
707
  value: 27.707749999999997
708
  - type: map_at_10
@@ -763,15 +703,6 @@ model-index:
763
  value: 40.39083333333334
764
  - type: recall_at_5
765
  value: 46.40083333333333
766
- - task:
767
- type: Retrieval
768
- dataset:
769
- type: BeIR/cqadupstack
770
- name: MTEB CQADupstackStatsRetrieval
771
- config: default
772
- split: test
773
- revision: None
774
- metrics:
775
  - type: map_at_1
776
  value: 26.482
777
  - type: map_at_10
@@ -832,15 +763,6 @@ model-index:
832
  value: 36.65
833
  - type: recall_at_5
834
  value: 40.774
835
- - task:
836
- type: Retrieval
837
- dataset:
838
- type: BeIR/cqadupstack
839
- name: MTEB CQADupstackTexRetrieval
840
- config: default
841
- split: test
842
- revision: None
843
- metrics:
844
  - type: map_at_1
845
  value: 18.815
846
  - type: map_at_10
@@ -901,15 +823,6 @@ model-index:
901
  value: 29.694
902
  - type: recall_at_5
903
  value: 34.935
904
- - task:
905
- type: Retrieval
906
- dataset:
907
- type: BeIR/cqadupstack
908
- name: MTEB CQADupstackUnixRetrieval
909
- config: default
910
- split: test
911
- revision: None
912
- metrics:
913
  - type: map_at_1
914
  value: 27.840999999999998
915
  - type: map_at_10
@@ -970,15 +883,6 @@ model-index:
970
  value: 40.146
971
  - type: recall_at_5
972
  value: 44.951
973
- - task:
974
- type: Retrieval
975
- dataset:
976
- type: BeIR/cqadupstack
977
- name: MTEB CQADupstackWebmastersRetrieval
978
- config: default
979
- split: test
980
- revision: None
981
- metrics:
982
  - type: map_at_1
983
  value: 26.529000000000003
984
  - type: map_at_10
@@ -1039,15 +943,6 @@ model-index:
1039
  value: 36.986000000000004
1040
  - type: recall_at_5
1041
  value: 43.096000000000004
1042
- - task:
1043
- type: Retrieval
1044
- dataset:
1045
- type: BeIR/cqadupstack
1046
- name: MTEB CQADupstackWordpressRetrieval
1047
- config: default
1048
- split: test
1049
- revision: None
1050
- metrics:
1051
  - type: map_at_1
1052
  value: 23.480999999999998
1053
  - type: map_at_10
@@ -1111,8 +1006,8 @@ model-index:
1111
  - task:
1112
  type: Retrieval
1113
  dataset:
1114
- type: climate-fever
1115
  name: MTEB ClimateFEVER
 
1116
  config: default
1117
  split: test
1118
  revision: None
@@ -1180,8 +1075,8 @@ model-index:
1180
  - task:
1181
  type: Retrieval
1182
  dataset:
1183
- type: dbpedia-entity
1184
  name: MTEB DBPedia
 
1185
  config: default
1186
  split: test
1187
  revision: None
@@ -1249,8 +1144,8 @@ model-index:
1249
  - task:
1250
  type: Classification
1251
  dataset:
1252
- type: mteb/emotion
1253
  name: MTEB EmotionClassification
 
1254
  config: default
1255
  split: test
1256
  revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
@@ -1262,8 +1157,8 @@ model-index:
1262
  - task:
1263
  type: Retrieval
1264
  dataset:
1265
- type: fever
1266
  name: MTEB FEVER
 
1267
  config: default
1268
  split: test
1269
  revision: None
@@ -1331,8 +1226,8 @@ model-index:
1331
  - task:
1332
  type: Retrieval
1333
  dataset:
1334
- type: fiqa
1335
  name: MTEB FiQA2018
 
1336
  config: default
1337
  split: test
1338
  revision: None
@@ -1400,8 +1295,8 @@ model-index:
1400
  - task:
1401
  type: Retrieval
1402
  dataset:
1403
- type: hotpotqa
1404
  name: MTEB HotpotQA
 
1405
  config: default
1406
  split: test
1407
  revision: None
@@ -1469,8 +1364,8 @@ model-index:
1469
  - task:
1470
  type: Classification
1471
  dataset:
1472
- type: mteb/imdb
1473
  name: MTEB ImdbClassification
 
1474
  config: default
1475
  split: test
1476
  revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
@@ -1484,8 +1379,8 @@ model-index:
1484
  - task:
1485
  type: Retrieval
1486
  dataset:
1487
- type: msmarco
1488
  name: MTEB MSMARCO
 
1489
  config: default
1490
  split: dev
1491
  revision: None
@@ -1553,8 +1448,8 @@ model-index:
1553
  - task:
1554
  type: Classification
1555
  dataset:
1556
- type: mteb/mtop_domain
1557
  name: MTEB MTOPDomainClassification (en)
 
1558
  config: en
1559
  split: test
1560
  revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
@@ -1566,8 +1461,8 @@ model-index:
1566
  - task:
1567
  type: Classification
1568
  dataset:
1569
- type: mteb/mtop_intent
1570
  name: MTEB MTOPIntentClassification (en)
 
1571
  config: en
1572
  split: test
1573
  revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
@@ -1579,8 +1474,8 @@ model-index:
1579
  - task:
1580
  type: Classification
1581
  dataset:
1582
- type: mteb/amazon_massive_intent
1583
  name: MTEB MassiveIntentClassification (en)
 
1584
  config: en
1585
  split: test
1586
  revision: 31efe3c427b0bae9c22cbb560b8f15491cc6bed7
@@ -1592,8 +1487,8 @@ model-index:
1592
  - task:
1593
  type: Classification
1594
  dataset:
1595
- type: mteb/amazon_massive_scenario
1596
  name: MTEB MassiveScenarioClassification (en)
 
1597
  config: en
1598
  split: test
1599
  revision: 7d571f92784cd94a019292a1f45445077d0ef634
@@ -1605,8 +1500,8 @@ model-index:
1605
  - task:
1606
  type: Clustering
1607
  dataset:
1608
- type: mteb/medrxiv-clustering-p2p
1609
  name: MTEB MedrxivClusteringP2P
 
1610
  config: default
1611
  split: test
1612
  revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
@@ -1616,8 +1511,8 @@ model-index:
1616
  - task:
1617
  type: Clustering
1618
  dataset:
1619
- type: mteb/medrxiv-clustering-s2s
1620
  name: MTEB MedrxivClusteringS2S
 
1621
  config: default
1622
  split: test
1623
  revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
@@ -1627,8 +1522,8 @@ model-index:
1627
  - task:
1628
  type: Reranking
1629
  dataset:
1630
- type: mteb/mind_small
1631
  name: MTEB MindSmallReranking
 
1632
  config: default
1633
  split: test
1634
  revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
@@ -1640,8 +1535,8 @@ model-index:
1640
  - task:
1641
  type: Retrieval
1642
  dataset:
1643
- type: nfcorpus
1644
  name: MTEB NFCorpus
 
1645
  config: default
1646
  split: test
1647
  revision: None
@@ -1709,8 +1604,8 @@ model-index:
1709
  - task:
1710
  type: Retrieval
1711
  dataset:
1712
- type: nq
1713
  name: MTEB NQ
 
1714
  config: default
1715
  split: test
1716
  revision: None
@@ -1778,8 +1673,8 @@ model-index:
1778
  - task:
1779
  type: Retrieval
1780
  dataset:
1781
- type: quora
1782
  name: MTEB QuoraRetrieval
 
1783
  config: default
1784
  split: test
1785
  revision: None
@@ -1847,8 +1742,8 @@ model-index:
1847
  - task:
1848
  type: Clustering
1849
  dataset:
1850
- type: mteb/reddit-clustering
1851
  name: MTEB RedditClustering
 
1852
  config: default
1853
  split: test
1854
  revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
@@ -1858,8 +1753,8 @@ model-index:
1858
  - task:
1859
  type: Clustering
1860
  dataset:
1861
- type: mteb/reddit-clustering-p2p
1862
  name: MTEB RedditClusteringP2P
 
1863
  config: default
1864
  split: test
1865
  revision: 282350215ef01743dc01b456c7f5241fa8937f16
@@ -1869,8 +1764,8 @@ model-index:
1869
  - task:
1870
  type: Retrieval
1871
  dataset:
1872
- type: scidocs
1873
  name: MTEB SCIDOCS
 
1874
  config: default
1875
  split: test
1876
  revision: None
@@ -1938,8 +1833,8 @@ model-index:
1938
  - task:
1939
  type: STS
1940
  dataset:
1941
- type: mteb/sickr-sts
1942
  name: MTEB SICK-R
 
1943
  config: default
1944
  split: test
1945
  revision: a6ea5a8cab320b040a23452cc28066d9beae2cee
@@ -1959,8 +1854,8 @@ model-index:
1959
  - task:
1960
  type: STS
1961
  dataset:
1962
- type: mteb/sts12-sts
1963
  name: MTEB STS12
 
1964
  config: default
1965
  split: test
1966
  revision: a0d554a64d88156834ff5ae9920b964011b16384
@@ -1980,8 +1875,8 @@ model-index:
1980
  - task:
1981
  type: STS
1982
  dataset:
1983
- type: mteb/sts13-sts
1984
  name: MTEB STS13
 
1985
  config: default
1986
  split: test
1987
  revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
@@ -2001,8 +1896,8 @@ model-index:
2001
  - task:
2002
  type: STS
2003
  dataset:
2004
- type: mteb/sts14-sts
2005
  name: MTEB STS14
 
2006
  config: default
2007
  split: test
2008
  revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
@@ -2022,8 +1917,8 @@ model-index:
2022
  - task:
2023
  type: STS
2024
  dataset:
2025
- type: mteb/sts15-sts
2026
  name: MTEB STS15
 
2027
  config: default
2028
  split: test
2029
  revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
@@ -2043,8 +1938,8 @@ model-index:
2043
  - task:
2044
  type: STS
2045
  dataset:
2046
- type: mteb/sts16-sts
2047
  name: MTEB STS16
 
2048
  config: default
2049
  split: test
2050
  revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
@@ -2064,8 +1959,8 @@ model-index:
2064
  - task:
2065
  type: STS
2066
  dataset:
2067
- type: mteb/sts17-crosslingual-sts
2068
  name: MTEB STS17 (en-en)
 
2069
  config: en-en
2070
  split: test
2071
  revision: af5e6fb845001ecf41f4c1e033ce921939a2a68d
@@ -2085,8 +1980,8 @@ model-index:
2085
  - task:
2086
  type: STS
2087
  dataset:
2088
- type: mteb/sts22-crosslingual-sts
2089
  name: MTEB STS22 (en)
 
2090
  config: en
2091
  split: test
2092
  revision: 6d1ba47164174a496b7fa5d3569dae26a6813b80
@@ -2106,8 +2001,8 @@ model-index:
2106
  - task:
2107
  type: STS
2108
  dataset:
2109
- type: mteb/stsbenchmark-sts
2110
  name: MTEB STSBenchmark
 
2111
  config: default
2112
  split: test
2113
  revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
@@ -2127,8 +2022,8 @@ model-index:
2127
  - task:
2128
  type: Reranking
2129
  dataset:
2130
- type: mteb/scidocs-reranking
2131
  name: MTEB SciDocsRR
 
2132
  config: default
2133
  split: test
2134
  revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
@@ -2140,8 +2035,8 @@ model-index:
2140
  - task:
2141
  type: Retrieval
2142
  dataset:
2143
- type: scifact
2144
  name: MTEB SciFact
 
2145
  config: default
2146
  split: test
2147
  revision: None
@@ -2209,8 +2104,8 @@ model-index:
2209
  - task:
2210
  type: PairClassification
2211
  dataset:
2212
- type: mteb/sprintduplicatequestions-pairclassification
2213
  name: MTEB SprintDuplicateQuestions
 
2214
  config: default
2215
  split: test
2216
  revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
@@ -2264,8 +2159,8 @@ model-index:
2264
  - task:
2265
  type: Clustering
2266
  dataset:
2267
- type: mteb/stackexchange-clustering
2268
  name: MTEB StackExchangeClustering
 
2269
  config: default
2270
  split: test
2271
  revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
@@ -2275,8 +2170,8 @@ model-index:
2275
  - task:
2276
  type: Clustering
2277
  dataset:
2278
- type: mteb/stackexchange-clustering-p2p
2279
  name: MTEB StackExchangeClusteringP2P
 
2280
  config: default
2281
  split: test
2282
  revision: 815ca46b2622cec33ccafc3735d572c266efdb44
@@ -2286,8 +2181,8 @@ model-index:
2286
  - task:
2287
  type: Reranking
2288
  dataset:
2289
- type: mteb/stackoverflowdupquestions-reranking
2290
  name: MTEB StackOverflowDupQuestions
 
2291
  config: default
2292
  split: test
2293
  revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
@@ -2299,8 +2194,8 @@ model-index:
2299
  - task:
2300
  type: Summarization
2301
  dataset:
2302
- type: mteb/summeval
2303
  name: MTEB SummEval
 
2304
  config: default
2305
  split: test
2306
  revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
@@ -2316,8 +2211,8 @@ model-index:
2316
  - task:
2317
  type: Retrieval
2318
  dataset:
2319
- type: trec-covid
2320
  name: MTEB TRECCOVID
 
2321
  config: default
2322
  split: test
2323
  revision: None
@@ -2385,8 +2280,8 @@ model-index:
2385
  - task:
2386
  type: Retrieval
2387
  dataset:
2388
- type: webis-touche2020
2389
  name: MTEB Touche2020
 
2390
  config: default
2391
  split: test
2392
  revision: None
@@ -2454,8 +2349,8 @@ model-index:
2454
  - task:
2455
  type: Classification
2456
  dataset:
2457
- type: mteb/toxic_conversations_50k
2458
  name: MTEB ToxicConversationsClassification
 
2459
  config: default
2460
  split: test
2461
  revision: d7c0de2777da35d6aae2200a62c6e0e5af397c4c
@@ -2469,8 +2364,8 @@ model-index:
2469
  - task:
2470
  type: Classification
2471
  dataset:
2472
- type: mteb/tweet_sentiment_extraction
2473
  name: MTEB TweetSentimentExtractionClassification
 
2474
  config: default
2475
  split: test
2476
  revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
@@ -2482,8 +2377,8 @@ model-index:
2482
  - task:
2483
  type: Clustering
2484
  dataset:
2485
- type: mteb/twentynewsgroups-clustering
2486
  name: MTEB TwentyNewsgroupsClustering
 
2487
  config: default
2488
  split: test
2489
  revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
@@ -2493,8 +2388,8 @@ model-index:
2493
  - task:
2494
  type: PairClassification
2495
  dataset:
2496
- type: mteb/twittersemeval2015-pairclassification
2497
  name: MTEB TwitterSemEval2015
 
2498
  config: default
2499
  split: test
2500
  revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
@@ -2548,8 +2443,8 @@ model-index:
2548
  - task:
2549
  type: PairClassification
2550
  dataset:
2551
- type: mteb/twitterurlcorpus-pairclassification
2552
  name: MTEB TwitterURLCorpus
 
2553
  config: default
2554
  split: test
2555
  revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
@@ -2600,9 +2495,6 @@ model-index:
2600
  value: 85.64591703003417
2601
  - type: max_f1
2602
  value: 77.59531005352656
2603
- license: mit
2604
- language:
2605
- - en
2606
  ---
2607
 
2608
 
 
5
  - sentence-similarity
6
  - transformers
7
  - mteb
8
+ license: mit
9
+ language:
10
+ - en
11
  model-index:
12
  - name: bge-base-en-v1.5
13
  results:
14
  - task:
15
  type: Classification
16
  dataset:
 
17
  name: MTEB AmazonCounterfactualClassification (en)
18
+ type: mteb/amazon_counterfactual
19
  config: en
20
  split: test
21
  revision: e8379541af4e31359cca9fbcf4b00f2671dba205
 
29
  - task:
30
  type: Classification
31
  dataset:
 
32
  name: MTEB AmazonPolarityClassification
33
+ type: mteb/amazon_polarity
34
  config: default
35
  split: test
36
  revision: e2d317d38cd51312af73b3d32a06d1a08b442046
 
44
  - task:
45
  type: Classification
46
  dataset:
 
47
  name: MTEB AmazonReviewsClassification (en)
48
+ type: mteb/amazon_reviews_multi
49
  config: en
50
  split: test
51
  revision: 1399c76144fd37290681b995c656ef9b2e06e26d
 
57
  - task:
58
  type: Retrieval
59
  dataset:
 
60
  name: MTEB ArguAna
61
+ type: arguana
62
  config: default
63
  split: test
64
  revision: None
 
126
  - task:
127
  type: Clustering
128
  dataset:
 
129
  name: MTEB ArxivClusteringP2P
130
+ type: mteb/arxiv-clustering-p2p
131
  config: default
132
  split: test
133
  revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
 
137
  - task:
138
  type: Clustering
139
  dataset:
 
140
  name: MTEB ArxivClusteringS2S
141
+ type: mteb/arxiv-clustering-s2s
142
  config: default
143
  split: test
144
  revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
 
148
  - task:
149
  type: Reranking
150
  dataset:
 
151
  name: MTEB AskUbuntuDupQuestions
152
+ type: mteb/askubuntudupquestions-reranking
153
  config: default
154
  split: test
155
  revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
 
161
  - task:
162
  type: STS
163
  dataset:
 
164
  name: MTEB BIOSSES
165
+ type: mteb/biosses-sts
166
  config: default
167
  split: test
168
  revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
 
182
  - task:
183
  type: Classification
184
  dataset:
 
185
  name: MTEB Banking77Classification
186
+ type: mteb/banking77
187
  config: default
188
  split: test
189
  revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
 
195
  - task:
196
  type: Clustering
197
  dataset:
 
198
  name: MTEB BiorxivClusteringP2P
199
+ type: mteb/biorxiv-clustering-p2p
200
  config: default
201
  split: test
202
  revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
 
206
  - task:
207
  type: Clustering
208
  dataset:
 
209
  name: MTEB BiorxivClusteringS2S
210
+ type: mteb/biorxiv-clustering-s2s
211
  config: default
212
  split: test
213
  revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
 
217
  - task:
218
  type: Retrieval
219
  dataset:
 
220
  name: MTEB CQADupstackAndroidRetrieval
221
+ type: BeIR/cqadupstack
222
  config: default
223
  split: test
224
  revision: None
 
283
  value: 48.065000000000005
284
  - type: recall_at_5
285
  value: 54.519
 
 
 
 
 
 
 
 
 
286
  - type: map_at_1
287
  value: 32.671
288
  - type: map_at_10
 
343
  value: 45.626
344
  - type: recall_at_5
345
  value: 51.812000000000005
 
 
 
 
 
 
 
 
 
346
  - type: map_at_1
347
  value: 41.185
348
  - type: map_at_10
 
403
  value: 59.199999999999996
404
  - type: recall_at_5
405
  value: 66.118
 
 
 
 
 
 
 
 
 
406
  - type: map_at_1
407
  value: 27.27
408
  - type: map_at_10
 
463
  value: 40.974
464
  - type: recall_at_5
465
  value: 47.327000000000005
 
 
 
 
 
 
 
 
 
466
  - type: map_at_1
467
  value: 17.848
468
  - type: map_at_10
 
523
  value: 29.18
524
  - type: recall_at_5
525
  value: 35.347
 
 
 
 
 
 
 
 
 
526
  - type: map_at_1
527
  value: 30.94
528
  - type: map_at_10
 
583
  value: 44.712
584
  - type: recall_at_5
585
  value: 51.932
 
 
 
 
 
 
 
 
 
586
  - type: map_at_1
587
  value: 27.104
588
  - type: map_at_10
 
643
  value: 39.92
644
  - type: recall_at_5
645
  value: 45.457
 
 
 
 
 
 
 
 
 
646
  - type: map_at_1
647
  value: 27.707749999999997
648
  - type: map_at_10
 
703
  value: 40.39083333333334
704
  - type: recall_at_5
705
  value: 46.40083333333333
 
 
 
 
 
 
 
 
 
706
  - type: map_at_1
707
  value: 26.482
708
  - type: map_at_10
 
763
  value: 36.65
764
  - type: recall_at_5
765
  value: 40.774
 
 
 
 
 
 
 
 
 
766
  - type: map_at_1
767
  value: 18.815
768
  - type: map_at_10
 
823
  value: 29.694
824
  - type: recall_at_5
825
  value: 34.935
 
 
 
 
 
 
 
 
 
826
  - type: map_at_1
827
  value: 27.840999999999998
828
  - type: map_at_10
 
883
  value: 40.146
884
  - type: recall_at_5
885
  value: 44.951
 
 
 
 
 
 
 
 
 
886
  - type: map_at_1
887
  value: 26.529000000000003
888
  - type: map_at_10
 
943
  value: 36.986000000000004
944
  - type: recall_at_5
945
  value: 43.096000000000004
 
 
 
 
 
 
 
 
 
946
  - type: map_at_1
947
  value: 23.480999999999998
948
  - type: map_at_10
 
1006
  - task:
1007
  type: Retrieval
1008
  dataset:
 
1009
  name: MTEB ClimateFEVER
1010
+ type: climate-fever
1011
  config: default
1012
  split: test
1013
  revision: None
 
1075
  - task:
1076
  type: Retrieval
1077
  dataset:
 
1078
  name: MTEB DBPedia
1079
+ type: dbpedia-entity
1080
  config: default
1081
  split: test
1082
  revision: None
 
1144
  - task:
1145
  type: Classification
1146
  dataset:
 
1147
  name: MTEB EmotionClassification
1148
+ type: mteb/emotion
1149
  config: default
1150
  split: test
1151
  revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
 
1157
  - task:
1158
  type: Retrieval
1159
  dataset:
 
1160
  name: MTEB FEVER
1161
+ type: fever
1162
  config: default
1163
  split: test
1164
  revision: None
 
1226
  - task:
1227
  type: Retrieval
1228
  dataset:
 
1229
  name: MTEB FiQA2018
1230
+ type: fiqa
1231
  config: default
1232
  split: test
1233
  revision: None
 
1295
  - task:
1296
  type: Retrieval
1297
  dataset:
 
1298
  name: MTEB HotpotQA
1299
+ type: hotpotqa
1300
  config: default
1301
  split: test
1302
  revision: None
 
1364
  - task:
1365
  type: Classification
1366
  dataset:
 
1367
  name: MTEB ImdbClassification
1368
+ type: mteb/imdb
1369
  config: default
1370
  split: test
1371
  revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
 
1379
  - task:
1380
  type: Retrieval
1381
  dataset:
 
1382
  name: MTEB MSMARCO
1383
+ type: msmarco
1384
  config: default
1385
  split: dev
1386
  revision: None
 
1448
  - task:
1449
  type: Classification
1450
  dataset:
 
1451
  name: MTEB MTOPDomainClassification (en)
1452
+ type: mteb/mtop_domain
1453
  config: en
1454
  split: test
1455
  revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
 
1461
  - task:
1462
  type: Classification
1463
  dataset:
 
1464
  name: MTEB MTOPIntentClassification (en)
1465
+ type: mteb/mtop_intent
1466
  config: en
1467
  split: test
1468
  revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
 
1474
  - task:
1475
  type: Classification
1476
  dataset:
 
1477
  name: MTEB MassiveIntentClassification (en)
1478
+ type: mteb/amazon_massive_intent
1479
  config: en
1480
  split: test
1481
  revision: 31efe3c427b0bae9c22cbb560b8f15491cc6bed7
 
1487
  - task:
1488
  type: Classification
1489
  dataset:
 
1490
  name: MTEB MassiveScenarioClassification (en)
1491
+ type: mteb/amazon_massive_scenario
1492
  config: en
1493
  split: test
1494
  revision: 7d571f92784cd94a019292a1f45445077d0ef634
 
1500
  - task:
1501
  type: Clustering
1502
  dataset:
 
1503
  name: MTEB MedrxivClusteringP2P
1504
+ type: mteb/medrxiv-clustering-p2p
1505
  config: default
1506
  split: test
1507
  revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
 
1511
  - task:
1512
  type: Clustering
1513
  dataset:
 
1514
  name: MTEB MedrxivClusteringS2S
1515
+ type: mteb/medrxiv-clustering-s2s
1516
  config: default
1517
  split: test
1518
  revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
 
1522
  - task:
1523
  type: Reranking
1524
  dataset:
 
1525
  name: MTEB MindSmallReranking
1526
+ type: mteb/mind_small
1527
  config: default
1528
  split: test
1529
  revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
 
1535
  - task:
1536
  type: Retrieval
1537
  dataset:
 
1538
  name: MTEB NFCorpus
1539
+ type: nfcorpus
1540
  config: default
1541
  split: test
1542
  revision: None
 
1604
  - task:
1605
  type: Retrieval
1606
  dataset:
 
1607
  name: MTEB NQ
1608
+ type: nq
1609
  config: default
1610
  split: test
1611
  revision: None
 
1673
  - task:
1674
  type: Retrieval
1675
  dataset:
 
1676
  name: MTEB QuoraRetrieval
1677
+ type: quora
1678
  config: default
1679
  split: test
1680
  revision: None
 
1742
  - task:
1743
  type: Clustering
1744
  dataset:
 
1745
  name: MTEB RedditClustering
1746
+ type: mteb/reddit-clustering
1747
  config: default
1748
  split: test
1749
  revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
 
1753
  - task:
1754
  type: Clustering
1755
  dataset:
 
1756
  name: MTEB RedditClusteringP2P
1757
+ type: mteb/reddit-clustering-p2p
1758
  config: default
1759
  split: test
1760
  revision: 282350215ef01743dc01b456c7f5241fa8937f16
 
1764
  - task:
1765
  type: Retrieval
1766
  dataset:
 
1767
  name: MTEB SCIDOCS
1768
+ type: scidocs
1769
  config: default
1770
  split: test
1771
  revision: None
 
1833
  - task:
1834
  type: STS
1835
  dataset:
 
1836
  name: MTEB SICK-R
1837
+ type: mteb/sickr-sts
1838
  config: default
1839
  split: test
1840
  revision: a6ea5a8cab320b040a23452cc28066d9beae2cee
 
1854
  - task:
1855
  type: STS
1856
  dataset:
 
1857
  name: MTEB STS12
1858
+ type: mteb/sts12-sts
1859
  config: default
1860
  split: test
1861
  revision: a0d554a64d88156834ff5ae9920b964011b16384
 
1875
  - task:
1876
  type: STS
1877
  dataset:
 
1878
  name: MTEB STS13
1879
+ type: mteb/sts13-sts
1880
  config: default
1881
  split: test
1882
  revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
 
1896
  - task:
1897
  type: STS
1898
  dataset:
 
1899
  name: MTEB STS14
1900
+ type: mteb/sts14-sts
1901
  config: default
1902
  split: test
1903
  revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
 
1917
  - task:
1918
  type: STS
1919
  dataset:
 
1920
  name: MTEB STS15
1921
+ type: mteb/sts15-sts
1922
  config: default
1923
  split: test
1924
  revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
 
1938
  - task:
1939
  type: STS
1940
  dataset:
 
1941
  name: MTEB STS16
1942
+ type: mteb/sts16-sts
1943
  config: default
1944
  split: test
1945
  revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
 
1959
  - task:
1960
  type: STS
1961
  dataset:
 
1962
  name: MTEB STS17 (en-en)
1963
+ type: mteb/sts17-crosslingual-sts
1964
  config: en-en
1965
  split: test
1966
  revision: af5e6fb845001ecf41f4c1e033ce921939a2a68d
 
1980
  - task:
1981
  type: STS
1982
  dataset:
 
1983
  name: MTEB STS22 (en)
1984
+ type: mteb/sts22-crosslingual-sts
1985
  config: en
1986
  split: test
1987
  revision: 6d1ba47164174a496b7fa5d3569dae26a6813b80
 
2001
  - task:
2002
  type: STS
2003
  dataset:
 
2004
  name: MTEB STSBenchmark
2005
+ type: mteb/stsbenchmark-sts
2006
  config: default
2007
  split: test
2008
  revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
 
2022
  - task:
2023
  type: Reranking
2024
  dataset:
 
2025
  name: MTEB SciDocsRR
2026
+ type: mteb/scidocs-reranking
2027
  config: default
2028
  split: test
2029
  revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
 
2035
  - task:
2036
  type: Retrieval
2037
  dataset:
 
2038
  name: MTEB SciFact
2039
+ type: scifact
2040
  config: default
2041
  split: test
2042
  revision: None
 
2104
  - task:
2105
  type: PairClassification
2106
  dataset:
 
2107
  name: MTEB SprintDuplicateQuestions
2108
+ type: mteb/sprintduplicatequestions-pairclassification
2109
  config: default
2110
  split: test
2111
  revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
 
2159
  - task:
2160
  type: Clustering
2161
  dataset:
 
2162
  name: MTEB StackExchangeClustering
2163
+ type: mteb/stackexchange-clustering
2164
  config: default
2165
  split: test
2166
  revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
 
2170
  - task:
2171
  type: Clustering
2172
  dataset:
 
2173
  name: MTEB StackExchangeClusteringP2P
2174
+ type: mteb/stackexchange-clustering-p2p
2175
  config: default
2176
  split: test
2177
  revision: 815ca46b2622cec33ccafc3735d572c266efdb44
 
2181
  - task:
2182
  type: Reranking
2183
  dataset:
 
2184
  name: MTEB StackOverflowDupQuestions
2185
+ type: mteb/stackoverflowdupquestions-reranking
2186
  config: default
2187
  split: test
2188
  revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
 
2194
  - task:
2195
  type: Summarization
2196
  dataset:
 
2197
  name: MTEB SummEval
2198
+ type: mteb/summeval
2199
  config: default
2200
  split: test
2201
  revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
 
2211
  - task:
2212
  type: Retrieval
2213
  dataset:
 
2214
  name: MTEB TRECCOVID
2215
+ type: trec-covid
2216
  config: default
2217
  split: test
2218
  revision: None
 
2280
  - task:
2281
  type: Retrieval
2282
  dataset:
 
2283
  name: MTEB Touche2020
2284
+ type: webis-touche2020
2285
  config: default
2286
  split: test
2287
  revision: None
 
2349
  - task:
2350
  type: Classification
2351
  dataset:
 
2352
  name: MTEB ToxicConversationsClassification
2353
+ type: mteb/toxic_conversations_50k
2354
  config: default
2355
  split: test
2356
  revision: d7c0de2777da35d6aae2200a62c6e0e5af397c4c
 
2364
  - task:
2365
  type: Classification
2366
  dataset:
 
2367
  name: MTEB TweetSentimentExtractionClassification
2368
+ type: mteb/tweet_sentiment_extraction
2369
  config: default
2370
  split: test
2371
  revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
 
2377
  - task:
2378
  type: Clustering
2379
  dataset:
 
2380
  name: MTEB TwentyNewsgroupsClustering
2381
+ type: mteb/twentynewsgroups-clustering
2382
  config: default
2383
  split: test
2384
  revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
 
2388
  - task:
2389
  type: PairClassification
2390
  dataset:
 
2391
  name: MTEB TwitterSemEval2015
2392
+ type: mteb/twittersemeval2015-pairclassification
2393
  config: default
2394
  split: test
2395
  revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
 
2443
  - task:
2444
  type: PairClassification
2445
  dataset:
 
2446
  name: MTEB TwitterURLCorpus
2447
+ type: mteb/twitterurlcorpus-pairclassification
2448
  config: default
2449
  split: test
2450
  revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
 
2495
  value: 85.64591703003417
2496
  - type: max_f1
2497
  value: 77.59531005352656
 
 
 
2498
  ---
2499
 
2500