Muennighoff commited on
Commit
5d4e702
1 Parent(s): 7853d0d

Add MTEB evaluation

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. {eval → evaluation/beir}/beir.json +0 -0
  2. evaluation/mteb/AmazonCounterfactualClassification.json +16 -0
  3. evaluation/mteb/AmazonPolarityClassification.json +14 -0
  4. evaluation/mteb/AmazonReviewsClassification.json +14 -0
  5. evaluation/mteb/ArguAna.json +37 -0
  6. evaluation/mteb/ArxivClusteringP2P.json +9 -0
  7. evaluation/mteb/ArxivClusteringS2S.json +9 -0
  8. evaluation/mteb/AskUbuntuDupQuestions.json +9 -0
  9. evaluation/mteb/BIOSSES.json +19 -0
  10. evaluation/mteb/Banking77Classification.json +12 -0
  11. evaluation/mteb/BiorxivClusteringP2P.json +9 -0
  12. evaluation/mteb/BiorxivClusteringS2S.json +9 -0
  13. evaluation/mteb/CQADupstackAndroidRetrieval.json +37 -0
  14. evaluation/mteb/CQADupstackEnglishRetrieval.json +37 -0
  15. evaluation/mteb/CQADupstackGamingRetrieval.json +37 -0
  16. evaluation/mteb/CQADupstackGisRetrieval.json +37 -0
  17. evaluation/mteb/CQADupstackMathematicaRetrieval.json +37 -0
  18. evaluation/mteb/CQADupstackPhysicsRetrieval.json +37 -0
  19. evaluation/mteb/CQADupstackProgrammersRetrieval.json +37 -0
  20. evaluation/mteb/CQADupstackRetrieval.json +1 -0
  21. evaluation/mteb/CQADupstackStatsRetrieval.json +37 -0
  22. evaluation/mteb/CQADupstackTexRetrieval.json +37 -0
  23. evaluation/mteb/CQADupstackUnixRetrieval.json +37 -0
  24. evaluation/mteb/CQADupstackWebmastersRetrieval.json +37 -0
  25. evaluation/mteb/CQADupstackWordpressRetrieval.json +37 -0
  26. evaluation/mteb/ClimateFEVER.json +37 -0
  27. evaluation/mteb/DBPedia.json +37 -0
  28. evaluation/mteb/EmotionClassification.json +12 -0
  29. evaluation/mteb/FEVER.json +37 -0
  30. evaluation/mteb/FiQA2018.json +37 -0
  31. evaluation/mteb/HotpotQA.json +37 -0
  32. evaluation/mteb/ImdbClassification.json +14 -0
  33. evaluation/mteb/MSMARCO.json +37 -0
  34. evaluation/mteb/MTOPDomainClassification.json +14 -0
  35. evaluation/mteb/MTOPIntentClassification.json +14 -0
  36. evaluation/mteb/MassiveIntentClassification.json +14 -0
  37. evaluation/mteb/MassiveScenarioClassification.json +14 -0
  38. evaluation/mteb/MedrxivClusteringP2P.json +9 -0
  39. evaluation/mteb/MedrxivClusteringS2S.json +9 -0
  40. evaluation/mteb/MindSmallReranking.json +9 -0
  41. evaluation/mteb/NFCorpus.json +37 -0
  42. evaluation/mteb/NQ.json +37 -0
  43. evaluation/mteb/QuoraRetrieval.json +37 -0
  44. evaluation/mteb/RedditClustering.json +9 -0
  45. evaluation/mteb/RedditClusteringP2P.json +9 -0
  46. evaluation/mteb/SCIDOCS.json +37 -0
  47. evaluation/mteb/SGPT-1.3B-weightedmean-msmarco-specb-bitfit_results.csv +355 -0
  48. evaluation/mteb/SICK-R.json +19 -0
  49. evaluation/mteb/STS12.json +19 -0
  50. evaluation/mteb/STS13.json +19 -0
{eval → evaluation/beir}/beir.json RENAMED
File without changes
evaluation/mteb/AmazonCounterfactualClassification.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.652089552238806,
7
+ "accuracy_stderr": 0.04707742824740793,
8
+ "ap": 0.2959212705444778,
9
+ "ap_stderr": 0.022393345886320606,
10
+ "f1": 0.5997099864321921,
11
+ "f1_stderr": 0.036697739411917986,
12
+ "main_score": 0.652089552238806
13
+ },
14
+ "evaluation_time": 23.71
15
+ }
16
+ }
evaluation/mteb/AmazonPolarityClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.7320565,
6
+ "accuracy_stderr": 0.04094219950430119,
7
+ "ap": 0.6736680643550963,
8
+ "ap_stderr": 0.03652809962256317,
9
+ "evaluation_time": 7801.59,
10
+ "f1": 0.7290420520325125,
11
+ "f1_stderr": 0.04396494850187113,
12
+ "main_score": 0.7320565
13
+ }
14
+ }
evaluation/mteb/AmazonReviewsClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.34956,
7
+ "accuracy_stderr": 0.018705464442242543,
8
+ "f1": 0.3471932443769695,
9
+ "f1_stderr": 0.017698150667922033,
10
+ "main_score": 0.34956
11
+ },
12
+ "evaluation_time": 73.75
13
+ }
14
+ }
evaluation/mteb/ArguAna.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 159.23,
6
+ "map_at_1": 0.26102,
7
+ "map_at_10": 0.40958,
8
+ "map_at_100": 0.42033,
9
+ "map_at_1000": 0.42042,
10
+ "map_at_3": 0.36332,
11
+ "map_at_5": 0.38608,
12
+ "mrr_at_1": 0.26387,
13
+ "mrr_at_10": 0.41051,
14
+ "mrr_at_100": 0.42118,
15
+ "mrr_at_1000": 0.42127,
16
+ "mrr_at_3": 0.36415,
17
+ "mrr_at_5": 0.3872,
18
+ "ndcg_at_1": 0.26102,
19
+ "ndcg_at_10": 0.4968,
20
+ "ndcg_at_100": 0.54258,
21
+ "ndcg_at_1000": 0.54486,
22
+ "ndcg_at_3": 0.39864,
23
+ "ndcg_at_5": 0.4398,
24
+ "precision_at_1": 0.26102,
25
+ "precision_at_10": 0.07781,
26
+ "precision_at_100": 0.00979,
27
+ "precision_at_1000": 0.001,
28
+ "precision_at_3": 0.16714,
29
+ "precision_at_5": 0.12034,
30
+ "recall_at_1": 0.26102,
31
+ "recall_at_10": 0.77809,
32
+ "recall_at_100": 0.97866,
33
+ "recall_at_1000": 0.99644,
34
+ "recall_at_3": 0.50142,
35
+ "recall_at_5": 0.60171
36
+ }
37
+ }
evaluation/mteb/ArxivClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 28476.56,
6
+ "v_measure": 0.4338419491695377,
7
+ "v_measure_std": 0.13772932292188322
8
+ }
9
+ }
evaluation/mteb/ArxivClusteringS2S.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3597.82,
6
+ "v_measure": 0.3370962633433912,
7
+ "v_measure_std": 0.14057785790111033
8
+ }
9
+ }
evaluation/mteb/AskUbuntuDupQuestions.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 29.27,
6
+ "map": 0.5813305899687008,
7
+ "mrr": 0.7210922041946972
8
+ }
9
+ }
evaluation/mteb/BIOSSES.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.8662153841660047,
7
+ "spearman": 0.8301514456843275
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.8600431518427242,
11
+ "spearman": 0.8385552516285784
12
+ },
13
+ "evaluation_time": 4.47,
14
+ "manhattan": {
15
+ "pearson": 0.8583025803351181,
16
+ "spearman": 0.8386636878343106
17
+ }
18
+ }
19
+ }
evaluation/mteb/Banking77Classification.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.8205844155844156,
6
+ "accuracy_stderr": 0.00898031054024437,
7
+ "evaluation_time": 70.71,
8
+ "f1": 0.8201858378847641,
9
+ "f1_stderr": 0.009423967637409204,
10
+ "main_score": 0.8205844155844156
11
+ }
12
+ }
evaluation/mteb/BiorxivClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3352.83,
6
+ "v_measure": 0.3505918333141837,
7
+ "v_measure_std": 0.00847894603883707
8
+ }
9
+ }
evaluation/mteb/BiorxivClusteringS2S.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 435.49,
6
+ "v_measure": 0.3071055028830579,
7
+ "v_measure_std": 0.008981834294010968
8
+ }
9
+ }
evaluation/mteb/CQADupstackAndroidRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 575.19,
6
+ "map_at_1": 0.26519,
7
+ "map_at_10": 0.35634,
8
+ "map_at_100": 0.36961,
9
+ "map_at_1000": 0.37088,
10
+ "map_at_3": 0.32254,
11
+ "map_at_5": 0.3422,
12
+ "mrr_at_1": 0.32332,
13
+ "mrr_at_10": 0.41168,
14
+ "mrr_at_100": 0.41977,
15
+ "mrr_at_1000": 0.42029,
16
+ "mrr_at_3": 0.38197,
17
+ "mrr_at_5": 0.40036,
18
+ "ndcg_at_1": 0.32332,
19
+ "ndcg_at_10": 0.41471,
20
+ "ndcg_at_100": 0.46956,
21
+ "ndcg_at_1000": 0.49262,
22
+ "ndcg_at_3": 0.35938,
23
+ "ndcg_at_5": 0.38703,
24
+ "precision_at_1": 0.32332,
25
+ "precision_at_10": 0.07783,
26
+ "precision_at_100": 0.0129,
27
+ "precision_at_1000": 0.00178,
28
+ "precision_at_3": 0.16834,
29
+ "precision_at_5": 0.12418,
30
+ "recall_at_1": 0.26519,
31
+ "recall_at_10": 0.5319,
32
+ "recall_at_100": 0.76565,
33
+ "recall_at_1000": 0.91478,
34
+ "recall_at_3": 0.38034,
35
+ "recall_at_5": 0.45246
36
+ }
37
+ }
evaluation/mteb/CQADupstackEnglishRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 874.22,
6
+ "map_at_1": 0.25356,
7
+ "map_at_10": 0.34596,
8
+ "map_at_100": 0.35714,
9
+ "map_at_1000": 0.3584,
10
+ "map_at_3": 0.32073,
11
+ "map_at_5": 0.33475,
12
+ "mrr_at_1": 0.31274,
13
+ "mrr_at_10": 0.39592,
14
+ "mrr_at_100": 0.40284,
15
+ "mrr_at_1000": 0.4034,
16
+ "mrr_at_3": 0.37378,
17
+ "mrr_at_5": 0.38658,
18
+ "ndcg_at_1": 0.31274,
19
+ "ndcg_at_10": 0.39766,
20
+ "ndcg_at_100": 0.44028,
21
+ "ndcg_at_1000": 0.46445,
22
+ "ndcg_at_3": 0.35934,
23
+ "ndcg_at_5": 0.37751,
24
+ "precision_at_1": 0.31274,
25
+ "precision_at_10": 0.07452,
26
+ "precision_at_100": 0.01217,
27
+ "precision_at_1000": 0.0017,
28
+ "precision_at_3": 0.17431,
29
+ "precision_at_5": 0.12306,
30
+ "recall_at_1": 0.25356,
31
+ "recall_at_10": 0.49344,
32
+ "recall_at_100": 0.67497,
33
+ "recall_at_1000": 0.83372,
34
+ "recall_at_3": 0.38227,
35
+ "recall_at_5": 0.43188
36
+ }
37
+ }
evaluation/mteb/CQADupstackGamingRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 931.63,
6
+ "map_at_1": 0.32759,
7
+ "map_at_10": 0.43937,
8
+ "map_at_100": 0.45004,
9
+ "map_at_1000": 0.4507,
10
+ "map_at_3": 0.40805,
11
+ "map_at_5": 0.42497,
12
+ "mrr_at_1": 0.37367,
13
+ "mrr_at_10": 0.47237,
14
+ "mrr_at_100": 0.47973,
15
+ "mrr_at_1000": 0.48011,
16
+ "mrr_at_3": 0.4465,
17
+ "mrr_at_5": 0.46051,
18
+ "ndcg_at_1": 0.37367,
19
+ "ndcg_at_10": 0.49659,
20
+ "ndcg_at_100": 0.54069,
21
+ "ndcg_at_1000": 0.55552,
22
+ "ndcg_at_3": 0.44169,
23
+ "ndcg_at_5": 0.46726,
24
+ "precision_at_1": 0.37367,
25
+ "precision_at_10": 0.08163,
26
+ "precision_at_100": 0.01133,
27
+ "precision_at_1000": 0.00131,
28
+ "precision_at_3": 0.19707,
29
+ "precision_at_5": 0.13718,
30
+ "recall_at_1": 0.32759,
31
+ "recall_at_10": 0.63341,
32
+ "recall_at_100": 0.82502,
33
+ "recall_at_1000": 0.93259,
34
+ "recall_at_3": 0.48796,
35
+ "recall_at_5": 0.54921
36
+ }
37
+ }
evaluation/mteb/CQADupstackGisRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1290.88,
6
+ "map_at_1": 0.18962,
7
+ "map_at_10": 0.25863,
8
+ "map_at_100": 0.26818,
9
+ "map_at_1000": 0.26918,
10
+ "map_at_3": 0.23043,
11
+ "map_at_5": 0.24599,
12
+ "mrr_at_1": 0.20452,
13
+ "mrr_at_10": 0.27301,
14
+ "mrr_at_100": 0.28233,
15
+ "mrr_at_1000": 0.2831,
16
+ "mrr_at_3": 0.24539,
17
+ "mrr_at_5": 0.26109,
18
+ "ndcg_at_1": 0.20452,
19
+ "ndcg_at_10": 0.30355,
20
+ "ndcg_at_100": 0.35336,
21
+ "ndcg_at_1000": 0.37927,
22
+ "ndcg_at_3": 0.24705,
23
+ "ndcg_at_5": 0.2742,
24
+ "precision_at_1": 0.20452,
25
+ "precision_at_10": 0.04949,
26
+ "precision_at_100": 0.0078,
27
+ "precision_at_1000": 0.00104,
28
+ "precision_at_3": 0.10358,
29
+ "precision_at_5": 0.07774,
30
+ "recall_at_1": 0.18962,
31
+ "recall_at_10": 0.43056,
32
+ "recall_at_100": 0.66273,
33
+ "recall_at_1000": 0.8596,
34
+ "recall_at_3": 0.27776,
35
+ "recall_at_5": 0.34287
36
+ }
37
+ }
evaluation/mteb/CQADupstackMathematicaRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 686.89,
6
+ "map_at_1": 0.1124,
7
+ "map_at_10": 0.18503,
8
+ "map_at_100": 0.19553,
9
+ "map_at_1000": 0.1969,
10
+ "map_at_3": 0.1615,
11
+ "map_at_5": 0.17254,
12
+ "mrr_at_1": 0.13806,
13
+ "mrr_at_10": 0.21939,
14
+ "mrr_at_100": 0.22827,
15
+ "mrr_at_1000": 0.22911,
16
+ "mrr_at_3": 0.1932,
17
+ "mrr_at_5": 0.20558,
18
+ "ndcg_at_1": 0.13806,
19
+ "ndcg_at_10": 0.23383,
20
+ "ndcg_at_100": 0.28834,
21
+ "ndcg_at_1000": 0.32175,
22
+ "ndcg_at_3": 0.18652,
23
+ "ndcg_at_5": 0.20505,
24
+ "precision_at_1": 0.13806,
25
+ "precision_at_10": 0.04714,
26
+ "precision_at_100": 0.00864,
27
+ "precision_at_1000": 0.0013,
28
+ "precision_at_3": 0.09328,
29
+ "precision_at_5": 0.06841,
30
+ "recall_at_1": 0.1124,
31
+ "recall_at_10": 0.34854,
32
+ "recall_at_100": 0.59503,
33
+ "recall_at_1000": 0.8325,
34
+ "recall_at_3": 0.2202,
35
+ "recall_at_5": 0.26715
36
+ }
37
+ }
evaluation/mteb/CQADupstackPhysicsRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1269.26,
6
+ "map_at_1": 0.23012,
7
+ "map_at_10": 0.33048,
8
+ "map_at_100": 0.34371,
9
+ "map_at_1000": 0.34489,
10
+ "map_at_3": 0.29943,
11
+ "map_at_5": 0.31602,
12
+ "mrr_at_1": 0.28104,
13
+ "mrr_at_10": 0.3799,
14
+ "mrr_at_100": 0.38836,
15
+ "mrr_at_1000": 0.38891,
16
+ "mrr_at_3": 0.35226,
17
+ "mrr_at_5": 0.36694,
18
+ "ndcg_at_1": 0.28104,
19
+ "ndcg_at_10": 0.39037,
20
+ "ndcg_at_100": 0.44643,
21
+ "ndcg_at_1000": 0.46939,
22
+ "ndcg_at_3": 0.33784,
23
+ "ndcg_at_5": 0.36126,
24
+ "precision_at_1": 0.28104,
25
+ "precision_at_10": 0.07267,
26
+ "precision_at_100": 0.01193,
27
+ "precision_at_1000": 0.00159,
28
+ "precision_at_3": 0.16298,
29
+ "precision_at_5": 0.11684,
30
+ "recall_at_1": 0.23012,
31
+ "recall_at_10": 0.52054,
32
+ "recall_at_100": 0.75622,
33
+ "recall_at_1000": 0.90675,
34
+ "recall_at_3": 0.37282,
35
+ "recall_at_5": 0.43307
36
+ }
37
+ }
evaluation/mteb/CQADupstackProgrammersRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1185.95,
6
+ "map_at_1": 0.21624,
7
+ "map_at_10": 0.3021,
8
+ "map_at_100": 0.3152,
9
+ "map_at_1000": 0.31626,
10
+ "map_at_3": 0.26951,
11
+ "map_at_5": 0.28939,
12
+ "mrr_at_1": 0.26941,
13
+ "mrr_at_10": 0.3513,
14
+ "mrr_at_100": 0.3615,
15
+ "mrr_at_1000": 0.36204,
16
+ "mrr_at_3": 0.3242,
17
+ "mrr_at_5": 0.34155,
18
+ "ndcg_at_1": 0.26941,
19
+ "ndcg_at_10": 0.35726,
20
+ "ndcg_at_100": 0.41725,
21
+ "ndcg_at_1000": 0.44105,
22
+ "ndcg_at_3": 0.30184,
23
+ "ndcg_at_5": 0.33176,
24
+ "precision_at_1": 0.26941,
25
+ "precision_at_10": 0.06655,
26
+ "precision_at_100": 0.01152,
27
+ "precision_at_1000": 0.00152,
28
+ "precision_at_3": 0.14346,
29
+ "precision_at_5": 0.10868,
30
+ "recall_at_1": 0.21624,
31
+ "recall_at_10": 0.47359,
32
+ "recall_at_100": 0.73436,
33
+ "recall_at_1000": 0.89988,
34
+ "recall_at_3": 0.3234,
35
+ "recall_at_5": 0.39856
36
+ }
37
+ }
evaluation/mteb/CQADupstackRetrieval.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"dataset_version": null, "mteb_version": "0.0.2", "test": {"evaluation_time": 1798.61, "map_at_1": 0.2067566666666667, "map_at_10": 0.28479333333333334, "map_at_100": 0.29612249999999996, "map_at_1000": 0.29731166666666664, "map_at_3": 0.25884, "map_at_5": 0.27298916666666667, "mrr_at_1": 0.24402583333333333, "mrr_at_10": 0.3207041666666667, "mrr_at_100": 0.32958416666666673, "mrr_at_1000": 0.3302541666666666, "mrr_at_3": 0.29677749999999997, "mrr_at_5": 0.3102391666666667, "ndcg_at_1": 0.24402583333333333, "ndcg_at_10": 0.3332616666666667, "ndcg_at_100": 0.38515666666666665, "ndcg_at_1000": 0.4113791666666667, "ndcg_at_3": 0.28687749999999995, "ndcg_at_5": 0.3084766666666667, "precision_at_1": 0.24402583333333333, "precision_at_10": 0.05943749999999999, "precision_at_100": 0.010098333333333334, "precision_at_1000": 0.0014183333333333333, "precision_at_3": 0.132115, "precision_at_5": 0.09548416666666668, "recall_at_1": 0.2067566666666667, "recall_at_10": 0.4424558333333334, "recall_at_100": 0.6731116666666667, "recall_at_1000": 0.8587841666666666, "recall_at_3": 0.3149258333333333, "recall_at_5": 0.3693241666666667}}
evaluation/mteb/CQADupstackStatsRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1614.26,
6
+ "map_at_1": 0.1834,
7
+ "map_at_10": 0.23988,
8
+ "map_at_100": 0.24895,
9
+ "map_at_1000": 0.24992,
10
+ "map_at_3": 0.21831,
11
+ "map_at_5": 0.23,
12
+ "mrr_at_1": 0.20399,
13
+ "mrr_at_10": 0.26186,
14
+ "mrr_at_100": 0.27018,
15
+ "mrr_at_1000": 0.27091,
16
+ "mrr_at_3": 0.2408,
17
+ "mrr_at_5": 0.2523,
18
+ "ndcg_at_1": 0.20399,
19
+ "ndcg_at_10": 0.27799,
20
+ "ndcg_at_100": 0.32579,
21
+ "ndcg_at_1000": 0.35209,
22
+ "ndcg_at_3": 0.23684,
23
+ "ndcg_at_5": 0.25521,
24
+ "precision_at_1": 0.20399,
25
+ "precision_at_10": 0.04586,
26
+ "precision_at_100": 0.00755,
27
+ "precision_at_1000": 0.00105,
28
+ "precision_at_3": 0.10276,
29
+ "precision_at_5": 0.07362,
30
+ "recall_at_1": 0.1834,
31
+ "recall_at_10": 0.37456,
32
+ "recall_at_100": 0.5986,
33
+ "recall_at_1000": 0.79703,
34
+ "recall_at_3": 0.26164,
35
+ "recall_at_5": 0.30652
36
+ }
37
+ }
evaluation/mteb/CQADupstackTexRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 2711.63,
6
+ "map_at_1": 0.12327,
7
+ "map_at_10": 0.17572,
8
+ "map_at_100": 0.18534,
9
+ "map_at_1000": 0.18653,
10
+ "map_at_3": 0.15703,
11
+ "map_at_5": 0.16752,
12
+ "mrr_at_1": 0.15038,
13
+ "mrr_at_10": 0.20726,
14
+ "mrr_at_100": 0.2161,
15
+ "mrr_at_1000": 0.21695,
16
+ "mrr_at_3": 0.18829,
17
+ "mrr_at_5": 0.19885,
18
+ "ndcg_at_1": 0.15038,
19
+ "ndcg_at_10": 0.21241,
20
+ "ndcg_at_100": 0.26179,
21
+ "ndcg_at_1000": 0.29316,
22
+ "ndcg_at_3": 0.17762,
23
+ "ndcg_at_5": 0.19413,
24
+ "precision_at_1": 0.15038,
25
+ "precision_at_10": 0.03892,
26
+ "precision_at_100": 0.0075,
27
+ "precision_at_1000": 0.00118,
28
+ "precision_at_3": 0.08351,
29
+ "precision_at_5": 0.06187,
30
+ "recall_at_1": 0.12327,
31
+ "recall_at_10": 0.29342,
32
+ "recall_at_100": 0.51854,
33
+ "recall_at_1000": 0.74648,
34
+ "recall_at_3": 0.19596,
35
+ "recall_at_5": 0.23899
36
+ }
37
+ }
evaluation/mteb/CQADupstackUnixRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1688.62,
6
+ "map_at_1": 0.20594,
7
+ "map_at_10": 0.27879,
8
+ "map_at_100": 0.28926,
9
+ "map_at_1000": 0.29041,
10
+ "map_at_3": 0.25669,
11
+ "map_at_5": 0.26774,
12
+ "mrr_at_1": 0.23694,
13
+ "mrr_at_10": 0.31335,
14
+ "mrr_at_100": 0.32218,
15
+ "mrr_at_1000": 0.32298,
16
+ "mrr_at_3": 0.2926,
17
+ "mrr_at_5": 0.30328,
18
+ "ndcg_at_1": 0.23694,
19
+ "ndcg_at_10": 0.32456,
20
+ "ndcg_at_100": 0.37667,
21
+ "ndcg_at_1000": 0.40571,
22
+ "ndcg_at_3": 0.28283,
23
+ "ndcg_at_5": 0.29986,
24
+ "precision_at_1": 0.23694,
25
+ "precision_at_10": 0.05448,
26
+ "precision_at_100": 0.00912,
27
+ "precision_at_1000": 0.00127,
28
+ "precision_at_3": 0.12718,
29
+ "precision_at_5": 0.08843,
30
+ "recall_at_1": 0.20594,
31
+ "recall_at_10": 0.43005,
32
+ "recall_at_100": 0.66228,
33
+ "recall_at_1000": 0.87171,
34
+ "recall_at_3": 0.31554,
35
+ "recall_at_5": 0.35838
36
+ }
37
+ }
evaluation/mteb/CQADupstackWebmastersRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 540.56,
6
+ "map_at_1": 0.20856,
7
+ "map_at_10": 0.28372,
8
+ "map_at_100": 0.2987,
9
+ "map_at_1000": 0.30075,
10
+ "map_at_3": 0.26054,
11
+ "map_at_5": 0.27129,
12
+ "mrr_at_1": 0.25494,
13
+ "mrr_at_10": 0.32735,
14
+ "mrr_at_100": 0.33794,
15
+ "mrr_at_1000": 0.3385,
16
+ "mrr_at_3": 0.30731,
17
+ "mrr_at_5": 0.31897,
18
+ "ndcg_at_1": 0.25494,
19
+ "ndcg_at_10": 0.33385,
20
+ "ndcg_at_100": 0.39436,
21
+ "ndcg_at_1000": 0.42313,
22
+ "ndcg_at_3": 0.29612,
23
+ "ndcg_at_5": 0.31187,
24
+ "precision_at_1": 0.25494,
25
+ "precision_at_10": 0.06423,
26
+ "precision_at_100": 0.01383,
27
+ "precision_at_1000": 0.00224,
28
+ "precision_at_3": 0.13834,
29
+ "precision_at_5": 0.1,
30
+ "recall_at_1": 0.20856,
31
+ "recall_at_10": 0.42678,
32
+ "recall_at_100": 0.70224,
33
+ "recall_at_1000": 0.89369,
34
+ "recall_at_3": 0.31957,
35
+ "recall_at_5": 0.36026
36
+ }
37
+ }
evaluation/mteb/CQADupstackWordpressRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1798.61,
6
+ "map_at_1": 0.16519,
7
+ "map_at_10": 0.2215,
8
+ "map_at_100": 0.23181,
9
+ "map_at_1000": 0.23292,
10
+ "map_at_3": 0.20132,
11
+ "map_at_5": 0.21346,
12
+ "mrr_at_1": 0.1793,
13
+ "mrr_at_10": 0.23506,
14
+ "mrr_at_100": 0.24581,
15
+ "mrr_at_1000": 0.24675,
16
+ "mrr_at_3": 0.21503,
17
+ "mrr_at_5": 0.22686,
18
+ "ndcg_at_1": 0.1793,
19
+ "ndcg_at_10": 0.25636,
20
+ "ndcg_at_100": 0.30736,
21
+ "ndcg_at_1000": 0.33841,
22
+ "ndcg_at_3": 0.21546,
23
+ "ndcg_at_5": 0.23658,
24
+ "precision_at_1": 0.1793,
25
+ "precision_at_10": 0.03993,
26
+ "precision_at_100": 0.00689,
27
+ "precision_at_1000": 0.00104,
28
+ "precision_at_3": 0.09057,
29
+ "precision_at_5": 0.0658,
30
+ "recall_at_1": 0.16519,
31
+ "recall_at_10": 0.35268,
32
+ "recall_at_100": 0.5817,
33
+ "recall_at_1000": 0.81668,
34
+ "recall_at_3": 0.24165,
35
+ "recall_at_5": 0.29254
36
+ }
37
+ }
evaluation/mteb/ClimateFEVER.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 16391.42,
6
+ "map_at_1": 0.10363,
7
+ "map_at_10": 0.18301,
8
+ "map_at_100": 0.20019,
9
+ "map_at_1000": 0.20207,
10
+ "map_at_3": 0.14877,
11
+ "map_at_5": 0.16544,
12
+ "mrr_at_1": 0.22866,
13
+ "mrr_at_10": 0.34935,
14
+ "mrr_at_100": 0.35802,
15
+ "mrr_at_1000": 0.3584,
16
+ "mrr_at_3": 0.30966,
17
+ "mrr_at_5": 0.33204,
18
+ "ndcg_at_1": 0.22866,
19
+ "ndcg_at_10": 0.26595,
20
+ "ndcg_at_100": 0.33514,
21
+ "ndcg_at_1000": 0.36872,
22
+ "ndcg_at_3": 0.20667,
23
+ "ndcg_at_5": 0.22728,
24
+ "precision_at_1": 0.22866,
25
+ "precision_at_10": 0.08632,
26
+ "precision_at_100": 0.01612,
27
+ "precision_at_1000": 0.00224,
28
+ "precision_at_3": 0.15505,
29
+ "precision_at_5": 0.12404,
30
+ "recall_at_1": 0.10363,
31
+ "recall_at_10": 0.33494,
32
+ "recall_at_100": 0.57593,
33
+ "recall_at_1000": 0.76342,
34
+ "recall_at_3": 0.19157,
35
+ "recall_at_5": 0.24638
36
+ }
37
+ }
evaluation/mteb/DBPedia.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 11184.99,
6
+ "map_at_1": 0.07436,
7
+ "map_at_10": 0.1476,
8
+ "map_at_100": 0.19206,
9
+ "map_at_1000": 0.20267,
10
+ "map_at_3": 0.10894,
11
+ "map_at_5": 0.12829,
12
+ "mrr_at_1": 0.5425,
13
+ "mrr_at_10": 0.63769,
14
+ "mrr_at_100": 0.64193,
15
+ "mrr_at_1000": 0.64211,
16
+ "mrr_at_3": 0.61458,
17
+ "mrr_at_5": 0.63096,
18
+ "ndcg_at_1": 0.42875,
19
+ "ndcg_at_10": 0.31507,
20
+ "ndcg_at_100": 0.34559,
21
+ "ndcg_at_1000": 0.41246,
22
+ "ndcg_at_3": 0.35058,
23
+ "ndcg_at_5": 0.33396,
24
+ "precision_at_1": 0.5425,
25
+ "precision_at_10": 0.2445,
26
+ "precision_at_100": 0.07383,
27
+ "precision_at_1000": 0.01582,
28
+ "precision_at_3": 0.38083,
29
+ "precision_at_5": 0.326,
30
+ "recall_at_1": 0.07436,
31
+ "recall_at_10": 0.19862,
32
+ "recall_at_100": 0.38981,
33
+ "recall_at_1000": 0.61038,
34
+ "recall_at_3": 0.11949,
35
+ "recall_at_5": 0.15562
36
+ }
37
+ }
evaluation/mteb/EmotionClassification.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.46390000000000003,
6
+ "accuracy_stderr": 0.018785366645343925,
7
+ "evaluation_time": 31.09,
8
+ "f1": 0.42264248858567033,
9
+ "f1_stderr": 0.011565342464001555,
10
+ "main_score": 0.46390000000000003
11
+ }
12
+ }
evaluation/mteb/FEVER.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 17506.78,
6
+ "map_at_1": 0.50916,
7
+ "map_at_10": 0.62258,
8
+ "map_at_100": 0.62741,
9
+ "map_at_1000": 0.62763,
10
+ "map_at_3": 0.60018,
11
+ "map_at_5": 0.6142,
12
+ "mrr_at_1": 0.54965,
13
+ "mrr_at_10": 0.66554,
14
+ "mrr_at_100": 0.66966,
15
+ "mrr_at_1000": 0.66978,
16
+ "mrr_at_3": 0.64414,
17
+ "mrr_at_5": 0.6577,
18
+ "ndcg_at_1": 0.54965,
19
+ "ndcg_at_10": 0.6812,
20
+ "ndcg_at_100": 0.70282,
21
+ "ndcg_at_1000": 0.70788,
22
+ "ndcg_at_3": 0.63862,
23
+ "ndcg_at_5": 0.66216,
24
+ "precision_at_1": 0.54965,
25
+ "precision_at_10": 0.08998,
26
+ "precision_at_100": 0.01016,
27
+ "precision_at_1000": 0.00107,
28
+ "precision_at_3": 0.25618,
29
+ "precision_at_5": 0.16676,
30
+ "recall_at_1": 0.50916,
31
+ "recall_at_10": 0.8204,
32
+ "recall_at_100": 0.91689,
33
+ "recall_at_1000": 0.95349,
34
+ "recall_at_3": 0.70512,
35
+ "recall_at_5": 0.76299
36
+ }
37
+ }
evaluation/mteb/FiQA2018.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 310.86,
6
+ "map_at_1": 0.13568,
7
+ "map_at_10": 0.23264,
8
+ "map_at_100": 0.24824,
9
+ "map_at_1000": 0.25014,
10
+ "map_at_3": 0.19724,
11
+ "map_at_5": 0.21772,
12
+ "mrr_at_1": 0.27315,
13
+ "mrr_at_10": 0.35935,
14
+ "mrr_at_100": 0.36929,
15
+ "mrr_at_1000": 0.36985,
16
+ "mrr_at_3": 0.33591,
17
+ "mrr_at_5": 0.34848,
18
+ "ndcg_at_1": 0.27315,
19
+ "ndcg_at_10": 0.29988,
20
+ "ndcg_at_100": 0.3641,
21
+ "ndcg_at_1000": 0.40185,
22
+ "ndcg_at_3": 0.26342,
23
+ "ndcg_at_5": 0.2768,
24
+ "precision_at_1": 0.27315,
25
+ "precision_at_10": 0.08565,
26
+ "precision_at_100": 0.01508,
27
+ "precision_at_1000": 0.00219,
28
+ "precision_at_3": 0.1785,
29
+ "precision_at_5": 0.13673,
30
+ "recall_at_1": 0.13568,
31
+ "recall_at_10": 0.37133,
32
+ "recall_at_100": 0.61475,
33
+ "recall_at_1000": 0.84372,
34
+ "recall_at_3": 0.24112,
35
+ "recall_at_5": 0.29507
36
+ }
37
+ }
evaluation/mteb/HotpotQA.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 13678.13,
6
+ "map_at_1": 0.30878,
7
+ "map_at_10": 0.40868,
8
+ "map_at_100": 0.41694,
9
+ "map_at_1000": 0.41775,
10
+ "map_at_3": 0.3856,
11
+ "map_at_5": 0.39947,
12
+ "mrr_at_1": 0.61756,
13
+ "mrr_at_10": 0.68265,
14
+ "mrr_at_100": 0.68671,
15
+ "mrr_at_1000": 0.68694,
16
+ "mrr_at_3": 0.66784,
17
+ "mrr_at_5": 0.67704,
18
+ "ndcg_at_1": 0.61756,
19
+ "ndcg_at_10": 0.49931,
20
+ "ndcg_at_100": 0.53179,
21
+ "ndcg_at_1000": 0.54948,
22
+ "ndcg_at_3": 0.46103,
23
+ "ndcg_at_5": 0.48147,
24
+ "precision_at_1": 0.61756,
25
+ "precision_at_10": 0.10163,
26
+ "precision_at_100": 0.01271,
27
+ "precision_at_1000": 0.00151,
28
+ "precision_at_3": 0.28179,
29
+ "precision_at_5": 0.18528,
30
+ "recall_at_1": 0.30878,
31
+ "recall_at_10": 0.50817,
32
+ "recall_at_100": 0.63545,
33
+ "recall_at_1000": 0.75361,
34
+ "recall_at_3": 0.42269,
35
+ "recall_at_5": 0.4632
36
+ }
37
+ }
evaluation/mteb/ImdbClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.6404799999999999,
6
+ "accuracy_stderr": 0.03197141223030349,
7
+ "ap": 0.5918525145533928,
8
+ "ap_stderr": 0.024531019346391677,
9
+ "evaluation_time": 915.58,
10
+ "f1": 0.6394712318134925,
11
+ "f1_stderr": 0.0317267000377415,
12
+ "main_score": 0.6404799999999999
13
+ }
14
+ }
evaluation/mteb/MSMARCO.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "validation": {
5
+ "evaluation_time": 22861.03,
6
+ "map_at_1": 0.189,
7
+ "map_at_10": 0.29748,
8
+ "map_at_100": 0.30976,
9
+ "map_at_1000": 0.31041,
10
+ "map_at_3": 0.26113,
11
+ "map_at_5": 0.28197,
12
+ "mrr_at_1": 0.19413,
13
+ "mrr_at_10": 0.30322,
14
+ "mrr_at_100": 0.31497,
15
+ "mrr_at_1000": 0.31555,
16
+ "mrr_at_3": 0.26729,
17
+ "mrr_at_5": 0.28789,
18
+ "ndcg_at_1": 0.19413,
19
+ "ndcg_at_10": 0.36048,
20
+ "ndcg_at_100": 0.42152,
21
+ "ndcg_at_1000": 0.43772,
22
+ "ndcg_at_3": 0.28642,
23
+ "ndcg_at_5": 0.32358,
24
+ "precision_at_1": 0.19413,
25
+ "precision_at_10": 0.05785,
26
+ "precision_at_100": 0.00887,
27
+ "precision_at_1000": 0.00103,
28
+ "precision_at_3": 0.12192,
29
+ "precision_at_5": 0.09189,
30
+ "recall_at_1": 0.189,
31
+ "recall_at_10": 0.55457,
32
+ "recall_at_100": 0.84091,
33
+ "recall_at_1000": 0.96482,
34
+ "recall_at_3": 0.35359,
35
+ "recall_at_5": 0.44275
36
+ }
37
+ }
evaluation/mteb/MTOPDomainClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.9207706338349293,
7
+ "accuracy_stderr": 0.005541106237593856,
8
+ "f1": 0.9156680443236652,
9
+ "f1_stderr": 0.005216941657420623,
10
+ "main_score": 0.9207706338349293
11
+ },
12
+ "evaluation_time": 31.37
13
+ }
14
+ }
evaluation/mteb/MTOPIntentClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.7118559051527589,
7
+ "accuracy_stderr": 0.012419016906278644,
8
+ "f1": 0.5242887061726789,
9
+ "f1_stderr": 0.011199354119349208,
10
+ "main_score": 0.7118559051527589
11
+ },
12
+ "evaluation_time": 82.02
13
+ }
14
+ }
evaluation/mteb/MassiveIntentClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.6864828513786148,
7
+ "accuracy_stderr": 0.012244395475104431,
8
+ "f1": 0.6654281381596097,
9
+ "f1_stderr": 0.009337695311493243,
10
+ "main_score": 0.6864828513786148
11
+ },
12
+ "evaluation_time": 49.93
13
+ }
14
+ }
evaluation/mteb/MassiveScenarioClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.7604236718224613,
7
+ "accuracy_stderr": 0.009702648067132833,
8
+ "f1": 0.7589170458655639,
9
+ "f1_stderr": 0.009666037600064457,
10
+ "main_score": 0.7604236718224613
11
+ },
12
+ "evaluation_time": 29.65
13
+ }
14
+ }
evaluation/mteb/MedrxivClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1694.42,
6
+ "v_measure": 0.320840369055247,
7
+ "v_measure_std": 0.012975340075124157
8
+ }
9
+ }
evaluation/mteb/MedrxivClusteringS2S.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 258.59,
6
+ "v_measure": 0.29448729560244535,
7
+ "v_measure_std": 0.014610308837145732
8
+ }
9
+ }
evaluation/mteb/MindSmallReranking.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 18115.54,
6
+ "map": 0.31340856463122374,
7
+ "mrr": 0.32398547669840916
8
+ }
9
+ }
evaluation/mteb/NFCorpus.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 101.25,
6
+ "map_at_1": 0.05526,
7
+ "map_at_10": 0.11745,
8
+ "map_at_100": 0.14831,
9
+ "map_at_1000": 0.16235,
10
+ "map_at_3": 0.08716,
11
+ "map_at_5": 0.10101,
12
+ "mrr_at_1": 0.43653,
13
+ "mrr_at_10": 0.51067,
14
+ "mrr_at_100": 0.51881,
15
+ "mrr_at_1000": 0.51912,
16
+ "mrr_at_3": 0.4902,
17
+ "mrr_at_5": 0.50289,
18
+ "ndcg_at_1": 0.4195,
19
+ "ndcg_at_10": 0.32083,
20
+ "ndcg_at_100": 0.3005,
21
+ "ndcg_at_1000": 0.38661,
22
+ "ndcg_at_3": 0.3794,
23
+ "ndcg_at_5": 0.35456,
24
+ "precision_at_1": 0.43344,
25
+ "precision_at_10": 0.23437,
26
+ "precision_at_100": 0.0783,
27
+ "precision_at_1000": 0.02053,
28
+ "precision_at_3": 0.35501,
29
+ "precision_at_5": 0.30464,
30
+ "recall_at_1": 0.05526,
31
+ "recall_at_10": 0.15446,
32
+ "recall_at_100": 0.31179,
33
+ "recall_at_1000": 0.61578,
34
+ "recall_at_3": 0.0971,
35
+ "recall_at_5": 0.12026
36
+ }
37
+ }
evaluation/mteb/NQ.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 8091.11,
6
+ "map_at_1": 0.23467,
7
+ "map_at_10": 0.36041,
8
+ "map_at_100": 0.37268,
9
+ "map_at_1000": 0.37322,
10
+ "map_at_3": 0.3209,
11
+ "map_at_5": 0.34414,
12
+ "mrr_at_1": 0.26738,
13
+ "mrr_at_10": 0.38665,
14
+ "mrr_at_100": 0.3964,
15
+ "mrr_at_1000": 0.39681,
16
+ "mrr_at_3": 0.35207,
17
+ "mrr_at_5": 0.3731,
18
+ "ndcg_at_1": 0.26709,
19
+ "ndcg_at_10": 0.42942,
20
+ "ndcg_at_100": 0.48296,
21
+ "ndcg_at_1000": 0.49651,
22
+ "ndcg_at_3": 0.35413,
23
+ "ndcg_at_5": 0.39368,
24
+ "precision_at_1": 0.26709,
25
+ "precision_at_10": 0.07306,
26
+ "precision_at_100": 0.01029,
27
+ "precision_at_1000": 0.00116,
28
+ "precision_at_3": 0.16348,
29
+ "precision_at_5": 0.12068,
30
+ "recall_at_1": 0.23467,
31
+ "recall_at_10": 0.61493,
32
+ "recall_at_100": 0.85011,
33
+ "recall_at_1000": 0.95261,
34
+ "recall_at_3": 0.41952,
35
+ "recall_at_5": 0.51106
36
+ }
37
+ }
evaluation/mteb/QuoraRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 742.32,
6
+ "map_at_1": 0.67517,
7
+ "map_at_10": 0.81054,
8
+ "map_at_100": 0.81727,
9
+ "map_at_1000": 0.81752,
10
+ "map_at_3": 0.78018,
11
+ "map_at_5": 0.79879,
12
+ "mrr_at_1": 0.7752,
13
+ "mrr_at_10": 0.84429,
14
+ "mrr_at_100": 0.84582,
15
+ "mrr_at_1000": 0.84584,
16
+ "mrr_at_3": 0.83268,
17
+ "mrr_at_5": 0.84013,
18
+ "ndcg_at_1": 0.7753,
19
+ "ndcg_at_10": 0.85277,
20
+ "ndcg_at_100": 0.86805,
21
+ "ndcg_at_1000": 0.8701,
22
+ "ndcg_at_3": 0.81975,
23
+ "ndcg_at_5": 0.83723,
24
+ "precision_at_1": 0.7753,
25
+ "precision_at_10": 0.12961,
26
+ "precision_at_100": 0.01502,
27
+ "precision_at_1000": 0.00156,
28
+ "precision_at_3": 0.35713,
29
+ "precision_at_5": 0.23574,
30
+ "recall_at_1": 0.67517,
31
+ "recall_at_10": 0.93486,
32
+ "recall_at_100": 0.989,
33
+ "recall_at_1000": 0.9993,
34
+ "recall_at_3": 0.8418,
35
+ "recall_at_5": 0.88975
36
+ }
37
+ }
evaluation/mteb/RedditClustering.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3324.44,
6
+ "v_measure": 0.48225994608749917,
7
+ "v_measure_std": 0.055941572162319216
8
+ }
9
+ }
evaluation/mteb/RedditClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 13390.64,
6
+ "v_measure": 0.5317635557157765,
7
+ "v_measure_std": 0.12570620726605897
8
+ }
9
+ }
evaluation/mteb/SCIDOCS.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 214.39,
6
+ "map_at_1": 0.03988,
7
+ "map_at_10": 0.094,
8
+ "map_at_100": 0.10968,
9
+ "map_at_1000": 0.11257,
10
+ "map_at_3": 0.07123,
11
+ "map_at_5": 0.08221,
12
+ "mrr_at_1": 0.197,
13
+ "mrr_at_10": 0.29098,
14
+ "mrr_at_100": 0.30247,
15
+ "mrr_at_1000": 0.30318,
16
+ "mrr_at_3": 0.2655,
17
+ "mrr_at_5": 0.27915,
18
+ "ndcg_at_1": 0.197,
19
+ "ndcg_at_10": 0.16176,
20
+ "ndcg_at_100": 0.22931,
21
+ "ndcg_at_1000": 0.28301,
22
+ "ndcg_at_3": 0.16142,
23
+ "ndcg_at_5": 0.13634,
24
+ "precision_at_1": 0.197,
25
+ "precision_at_10": 0.0818,
26
+ "precision_at_100": 0.01801,
27
+ "precision_at_1000": 0.00309,
28
+ "precision_at_3": 0.151,
29
+ "precision_at_5": 0.1174,
30
+ "recall_at_1": 0.03988,
31
+ "recall_at_10": 0.16625,
32
+ "recall_at_100": 0.3661,
33
+ "recall_at_1000": 0.62805,
34
+ "recall_at_3": 0.09168,
35
+ "recall_at_5": 0.11902
36
+ }
37
+ }
evaluation/mteb/SGPT-1.3B-weightedmean-msmarco-specb-bitfit_results.csv ADDED
@@ -0,0 +1,355 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,task,dataset,language,metric,value
2
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,BitextMining,BUCC,,f1,
3
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,BitextMining,Tatoeba,,f1,
4
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en,accuracy,0.652089552238806
5
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
6
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
7
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
8
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
9
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
10
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
11
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonPolarityClassification,en,accuracy,0.7320565
12
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,en,accuracy,0.34956
13
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
14
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
15
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
16
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
17
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
18
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
19
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
20
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
21
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
22
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
23
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,Banking77Classification,en,accuracy,0.8205844155844156
24
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,EmotionClassification,en,accuracy,0.46390000000000003
25
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,ImdbClassification,en,accuracy,0.6404799999999999
26
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
27
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
28
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
29
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
30
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
31
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
32
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
33
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
34
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
35
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
36
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
37
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
38
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
39
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
40
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
41
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
42
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
43
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
44
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,en,accuracy,0.6864828513786148
45
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
46
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
47
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
48
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
49
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
50
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
51
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
52
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
53
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
54
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
55
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
56
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
57
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
58
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
59
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
60
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
61
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
62
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
63
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
64
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
65
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
66
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
67
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
68
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
69
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
70
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
71
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
72
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
73
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
74
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
75
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
76
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
77
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
78
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
79
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
80
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
81
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
82
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
83
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
84
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
85
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
86
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
87
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
88
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
89
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
90
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
91
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
92
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
93
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
94
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
95
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
96
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
97
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
98
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
99
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
100
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
101
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
102
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
103
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
104
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
105
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
106
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
107
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
108
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
109
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
110
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
111
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
112
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
113
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
114
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
115
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
116
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
117
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
118
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
119
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
120
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
121
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
122
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
123
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
124
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
125
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
126
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
127
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
128
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
129
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
130
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
131
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
132
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
133
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
134
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
135
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
136
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
137
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
138
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
139
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
140
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
141
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
142
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
143
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
144
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
145
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,en,accuracy,0.7604236718224613
146
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
147
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
148
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
149
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
150
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
151
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
152
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
153
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
154
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
155
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
156
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
157
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
158
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
159
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
160
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
161
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
162
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
163
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
164
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
165
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
166
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
167
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
168
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
169
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
170
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
171
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
172
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
173
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
174
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
175
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
176
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
177
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
178
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
179
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
180
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
181
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
182
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
183
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
184
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
185
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
186
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
187
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
188
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
189
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
190
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
191
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
192
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
193
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
194
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
195
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
196
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
197
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
198
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
199
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
200
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
201
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
202
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
203
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
204
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
205
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
206
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
207
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
208
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
209
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
210
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
211
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
212
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
213
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
214
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
215
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
216
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
217
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
218
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
219
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
220
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
221
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
222
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
223
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
224
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
225
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
226
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
227
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
228
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,en,accuracy,0.9207706338349293
229
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
230
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
231
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
232
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
233
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
234
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
235
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
236
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
237
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
238
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
239
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,en,accuracy,0.7118559051527589
240
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
241
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
242
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
243
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
244
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
245
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
246
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
247
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
248
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
249
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
250
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,ToxicConversationsClassification,en,accuracy,0.687272
251
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,TweetSentimentExtractionClassification,en,accuracy,0.556677985285795
252
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringP2P,en,v_measure,0.4338419491695377
253
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringS2S,en,v_measure,0.3370962633433912
254
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringP2P,en,v_measure,0.3505918333141837
255
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringS2S,en,v_measure,0.3071055028830579
256
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringP2P,en,v_measure,0.320840369055247
257
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringS2S,en,v_measure,0.29448729560244535
258
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClustering,en,v_measure,0.48225994608749917
259
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClusteringP2P,en,v_measure,0.5317635557157765
260
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClustering,en,v_measure,0.6085593925770172
261
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClusteringP2P,en,v_measure,0.323567729982375
262
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,TwentyNewsgroupsClustering,en,v_measure,0.4005809562275603
263
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,SprintDuplicateQuestions,en,ap,0.9257836032673468
264
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterSemEval2015,en,ap,0.6237052608803734
265
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterURLCorpus,en,ap,0.8378748636891035
266
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,AskUbuntuDupQuestions,en,map,0.5813305899687008
267
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,MindSmallReranking,en,map,0.31340856463122374
268
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,SciDocsRR,en,map,0.7721233007730808
269
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,StackOverflowDupQuestions,en,map,0.49320607035290737
270
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,ArguAna,en,ndcg_at_10,0.4968
271
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,ClimateFEVER,en,ndcg_at_10,0.26595
272
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,CQADupstackRetrieval,en,ndcg_at_10,0.3332616666666667
273
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,DBPedia,en,ndcg_at_10,0.31507
274
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,FEVER,en,ndcg_at_10,0.6812
275
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,FiQA2018,en,ndcg_at_10,0.29988
276
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,HotpotQA,en,ndcg_at_10,0.49931
277
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,MSMARCO,en,ndcg_at_10,0.36048
278
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,NFCorpus,en,ndcg_at_10,0.32083
279
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,NQ,en,ndcg_at_10,0.42942
280
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,QuoraRetrieval,en,ndcg_at_10,0.85277
281
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,SCIDOCS,en,ndcg_at_10,0.16176
282
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,SciFact,en,ndcg_at_10,0.68287
283
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,Touche2020,en,ndcg_at_10,0.2445
284
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,TRECCOVID,en,ndcg_at_10,0.7298
285
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,BIOSSES,en,cosine_spearman,0.8301514456843275
286
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,SICK-R,en,cosine_spearman,0.6722953551111448
287
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS12,en,cosine_spearman,0.6659241013465915
288
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS13,en,cosine_spearman,0.7733151317062642
289
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS14,en,cosine_spearman,0.7182815265534886
290
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS15,en,cosine_spearman,0.8065931167868883
291
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS16,en,cosine_spearman,0.7891151365939403
292
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
293
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
294
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
295
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
296
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
297
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
298
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
299
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
300
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-en,cosine_spearman,0.8698674844768606
301
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
302
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
303
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
304
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
305
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
306
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
307
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
308
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
309
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
310
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
311
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
312
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
313
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,en,cosine_spearman,0.6730387805090023
314
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
315
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
316
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
317
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
318
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
319
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
320
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
321
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
322
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
323
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
324
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
325
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
326
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
327
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
328
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
329
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
330
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
331
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
332
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
333
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
334
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
335
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
336
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
337
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
338
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
339
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
340
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
341
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
342
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
343
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
344
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
345
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
346
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
347
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
348
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STSBenchmark,en,cosine_spearman,0.775887175717799
349
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Summarization,SummEval,en,cosine_spearman,0.25440272876996695
350
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,average,en,accuracy,0.6651794596081484
351
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,average,en,v_measure,0.3991540721780082
352
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,average,en,ap,0.7957879092789413
353
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,average,en,map,0.5400171314314782
354
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,average,en,ndcg_at_10,0.4449267777777778
355
+ SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,average,en,cosine_spearman,0.7574469254486307
evaluation/mteb/SICK-R.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7729330379162072,
7
+ "spearman": 0.6722953551111448
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.7144682700059415,
11
+ "spearman": 0.6633178012153248
12
+ },
13
+ "evaluation_time": 52.38,
14
+ "manhattan": {
15
+ "pearson": 0.7146941734657887,
16
+ "spearman": 0.6643234359835815
17
+ }
18
+ }
19
+ }
evaluation/mteb/STS12.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7540943196466576,
7
+ "spearman": 0.6659241013465915
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.7132500540796616,
11
+ "spearman": 0.6786667467202591
12
+ },
13
+ "evaluation_time": 26.18,
14
+ "manhattan": {
15
+ "pearson": 0.7148209832089134,
16
+ "spearman": 0.6794511626964879
17
+ }
18
+ }
19
+ }
evaluation/mteb/STS13.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7708302398877518,
7
+ "spearman": 0.7733151317062642
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.7677020279715008,
11
+ "spearman": 0.7713893776083225
12
+ },
13
+ "evaluation_time": 12.09,
14
+ "manhattan": {
15
+ "pearson": 0.7676732290707478,
16
+ "spearman": 0.7714500877396631
17
+ }
18
+ }
19
+ }