Commit
·
5d4e702
1
Parent(s):
7853d0d
Add MTEB evaluation
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- {eval → evaluation/beir}/beir.json +0 -0
- evaluation/mteb/AmazonCounterfactualClassification.json +16 -0
- evaluation/mteb/AmazonPolarityClassification.json +14 -0
- evaluation/mteb/AmazonReviewsClassification.json +14 -0
- evaluation/mteb/ArguAna.json +37 -0
- evaluation/mteb/ArxivClusteringP2P.json +9 -0
- evaluation/mteb/ArxivClusteringS2S.json +9 -0
- evaluation/mteb/AskUbuntuDupQuestions.json +9 -0
- evaluation/mteb/BIOSSES.json +19 -0
- evaluation/mteb/Banking77Classification.json +12 -0
- evaluation/mteb/BiorxivClusteringP2P.json +9 -0
- evaluation/mteb/BiorxivClusteringS2S.json +9 -0
- evaluation/mteb/CQADupstackAndroidRetrieval.json +37 -0
- evaluation/mteb/CQADupstackEnglishRetrieval.json +37 -0
- evaluation/mteb/CQADupstackGamingRetrieval.json +37 -0
- evaluation/mteb/CQADupstackGisRetrieval.json +37 -0
- evaluation/mteb/CQADupstackMathematicaRetrieval.json +37 -0
- evaluation/mteb/CQADupstackPhysicsRetrieval.json +37 -0
- evaluation/mteb/CQADupstackProgrammersRetrieval.json +37 -0
- evaluation/mteb/CQADupstackRetrieval.json +1 -0
- evaluation/mteb/CQADupstackStatsRetrieval.json +37 -0
- evaluation/mteb/CQADupstackTexRetrieval.json +37 -0
- evaluation/mteb/CQADupstackUnixRetrieval.json +37 -0
- evaluation/mteb/CQADupstackWebmastersRetrieval.json +37 -0
- evaluation/mteb/CQADupstackWordpressRetrieval.json +37 -0
- evaluation/mteb/ClimateFEVER.json +37 -0
- evaluation/mteb/DBPedia.json +37 -0
- evaluation/mteb/EmotionClassification.json +12 -0
- evaluation/mteb/FEVER.json +37 -0
- evaluation/mteb/FiQA2018.json +37 -0
- evaluation/mteb/HotpotQA.json +37 -0
- evaluation/mteb/ImdbClassification.json +14 -0
- evaluation/mteb/MSMARCO.json +37 -0
- evaluation/mteb/MTOPDomainClassification.json +14 -0
- evaluation/mteb/MTOPIntentClassification.json +14 -0
- evaluation/mteb/MassiveIntentClassification.json +14 -0
- evaluation/mteb/MassiveScenarioClassification.json +14 -0
- evaluation/mteb/MedrxivClusteringP2P.json +9 -0
- evaluation/mteb/MedrxivClusteringS2S.json +9 -0
- evaluation/mteb/MindSmallReranking.json +9 -0
- evaluation/mteb/NFCorpus.json +37 -0
- evaluation/mteb/NQ.json +37 -0
- evaluation/mteb/QuoraRetrieval.json +37 -0
- evaluation/mteb/RedditClustering.json +9 -0
- evaluation/mteb/RedditClusteringP2P.json +9 -0
- evaluation/mteb/SCIDOCS.json +37 -0
- evaluation/mteb/SGPT-1.3B-weightedmean-msmarco-specb-bitfit_results.csv +355 -0
- evaluation/mteb/SICK-R.json +19 -0
- evaluation/mteb/STS12.json +19 -0
- evaluation/mteb/STS13.json +19 -0
{eval → evaluation/beir}/beir.json
RENAMED
File without changes
|
evaluation/mteb/AmazonCounterfactualClassification.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.652089552238806,
|
7 |
+
"accuracy_stderr": 0.04707742824740793,
|
8 |
+
"ap": 0.2959212705444778,
|
9 |
+
"ap_stderr": 0.022393345886320606,
|
10 |
+
"f1": 0.5997099864321921,
|
11 |
+
"f1_stderr": 0.036697739411917986,
|
12 |
+
"main_score": 0.652089552238806
|
13 |
+
},
|
14 |
+
"evaluation_time": 23.71
|
15 |
+
}
|
16 |
+
}
|
evaluation/mteb/AmazonPolarityClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.7320565,
|
6 |
+
"accuracy_stderr": 0.04094219950430119,
|
7 |
+
"ap": 0.6736680643550963,
|
8 |
+
"ap_stderr": 0.03652809962256317,
|
9 |
+
"evaluation_time": 7801.59,
|
10 |
+
"f1": 0.7290420520325125,
|
11 |
+
"f1_stderr": 0.04396494850187113,
|
12 |
+
"main_score": 0.7320565
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/AmazonReviewsClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.34956,
|
7 |
+
"accuracy_stderr": 0.018705464442242543,
|
8 |
+
"f1": 0.3471932443769695,
|
9 |
+
"f1_stderr": 0.017698150667922033,
|
10 |
+
"main_score": 0.34956
|
11 |
+
},
|
12 |
+
"evaluation_time": 73.75
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/ArguAna.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 159.23,
|
6 |
+
"map_at_1": 0.26102,
|
7 |
+
"map_at_10": 0.40958,
|
8 |
+
"map_at_100": 0.42033,
|
9 |
+
"map_at_1000": 0.42042,
|
10 |
+
"map_at_3": 0.36332,
|
11 |
+
"map_at_5": 0.38608,
|
12 |
+
"mrr_at_1": 0.26387,
|
13 |
+
"mrr_at_10": 0.41051,
|
14 |
+
"mrr_at_100": 0.42118,
|
15 |
+
"mrr_at_1000": 0.42127,
|
16 |
+
"mrr_at_3": 0.36415,
|
17 |
+
"mrr_at_5": 0.3872,
|
18 |
+
"ndcg_at_1": 0.26102,
|
19 |
+
"ndcg_at_10": 0.4968,
|
20 |
+
"ndcg_at_100": 0.54258,
|
21 |
+
"ndcg_at_1000": 0.54486,
|
22 |
+
"ndcg_at_3": 0.39864,
|
23 |
+
"ndcg_at_5": 0.4398,
|
24 |
+
"precision_at_1": 0.26102,
|
25 |
+
"precision_at_10": 0.07781,
|
26 |
+
"precision_at_100": 0.00979,
|
27 |
+
"precision_at_1000": 0.001,
|
28 |
+
"precision_at_3": 0.16714,
|
29 |
+
"precision_at_5": 0.12034,
|
30 |
+
"recall_at_1": 0.26102,
|
31 |
+
"recall_at_10": 0.77809,
|
32 |
+
"recall_at_100": 0.97866,
|
33 |
+
"recall_at_1000": 0.99644,
|
34 |
+
"recall_at_3": 0.50142,
|
35 |
+
"recall_at_5": 0.60171
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/ArxivClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 28476.56,
|
6 |
+
"v_measure": 0.4338419491695377,
|
7 |
+
"v_measure_std": 0.13772932292188322
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/ArxivClusteringS2S.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3597.82,
|
6 |
+
"v_measure": 0.3370962633433912,
|
7 |
+
"v_measure_std": 0.14057785790111033
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/AskUbuntuDupQuestions.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 29.27,
|
6 |
+
"map": 0.5813305899687008,
|
7 |
+
"mrr": 0.7210922041946972
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/BIOSSES.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.8662153841660047,
|
7 |
+
"spearman": 0.8301514456843275
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.8600431518427242,
|
11 |
+
"spearman": 0.8385552516285784
|
12 |
+
},
|
13 |
+
"evaluation_time": 4.47,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.8583025803351181,
|
16 |
+
"spearman": 0.8386636878343106
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/Banking77Classification.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.8205844155844156,
|
6 |
+
"accuracy_stderr": 0.00898031054024437,
|
7 |
+
"evaluation_time": 70.71,
|
8 |
+
"f1": 0.8201858378847641,
|
9 |
+
"f1_stderr": 0.009423967637409204,
|
10 |
+
"main_score": 0.8205844155844156
|
11 |
+
}
|
12 |
+
}
|
evaluation/mteb/BiorxivClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3352.83,
|
6 |
+
"v_measure": 0.3505918333141837,
|
7 |
+
"v_measure_std": 0.00847894603883707
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/BiorxivClusteringS2S.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 435.49,
|
6 |
+
"v_measure": 0.3071055028830579,
|
7 |
+
"v_measure_std": 0.008981834294010968
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/CQADupstackAndroidRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 575.19,
|
6 |
+
"map_at_1": 0.26519,
|
7 |
+
"map_at_10": 0.35634,
|
8 |
+
"map_at_100": 0.36961,
|
9 |
+
"map_at_1000": 0.37088,
|
10 |
+
"map_at_3": 0.32254,
|
11 |
+
"map_at_5": 0.3422,
|
12 |
+
"mrr_at_1": 0.32332,
|
13 |
+
"mrr_at_10": 0.41168,
|
14 |
+
"mrr_at_100": 0.41977,
|
15 |
+
"mrr_at_1000": 0.42029,
|
16 |
+
"mrr_at_3": 0.38197,
|
17 |
+
"mrr_at_5": 0.40036,
|
18 |
+
"ndcg_at_1": 0.32332,
|
19 |
+
"ndcg_at_10": 0.41471,
|
20 |
+
"ndcg_at_100": 0.46956,
|
21 |
+
"ndcg_at_1000": 0.49262,
|
22 |
+
"ndcg_at_3": 0.35938,
|
23 |
+
"ndcg_at_5": 0.38703,
|
24 |
+
"precision_at_1": 0.32332,
|
25 |
+
"precision_at_10": 0.07783,
|
26 |
+
"precision_at_100": 0.0129,
|
27 |
+
"precision_at_1000": 0.00178,
|
28 |
+
"precision_at_3": 0.16834,
|
29 |
+
"precision_at_5": 0.12418,
|
30 |
+
"recall_at_1": 0.26519,
|
31 |
+
"recall_at_10": 0.5319,
|
32 |
+
"recall_at_100": 0.76565,
|
33 |
+
"recall_at_1000": 0.91478,
|
34 |
+
"recall_at_3": 0.38034,
|
35 |
+
"recall_at_5": 0.45246
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackEnglishRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 874.22,
|
6 |
+
"map_at_1": 0.25356,
|
7 |
+
"map_at_10": 0.34596,
|
8 |
+
"map_at_100": 0.35714,
|
9 |
+
"map_at_1000": 0.3584,
|
10 |
+
"map_at_3": 0.32073,
|
11 |
+
"map_at_5": 0.33475,
|
12 |
+
"mrr_at_1": 0.31274,
|
13 |
+
"mrr_at_10": 0.39592,
|
14 |
+
"mrr_at_100": 0.40284,
|
15 |
+
"mrr_at_1000": 0.4034,
|
16 |
+
"mrr_at_3": 0.37378,
|
17 |
+
"mrr_at_5": 0.38658,
|
18 |
+
"ndcg_at_1": 0.31274,
|
19 |
+
"ndcg_at_10": 0.39766,
|
20 |
+
"ndcg_at_100": 0.44028,
|
21 |
+
"ndcg_at_1000": 0.46445,
|
22 |
+
"ndcg_at_3": 0.35934,
|
23 |
+
"ndcg_at_5": 0.37751,
|
24 |
+
"precision_at_1": 0.31274,
|
25 |
+
"precision_at_10": 0.07452,
|
26 |
+
"precision_at_100": 0.01217,
|
27 |
+
"precision_at_1000": 0.0017,
|
28 |
+
"precision_at_3": 0.17431,
|
29 |
+
"precision_at_5": 0.12306,
|
30 |
+
"recall_at_1": 0.25356,
|
31 |
+
"recall_at_10": 0.49344,
|
32 |
+
"recall_at_100": 0.67497,
|
33 |
+
"recall_at_1000": 0.83372,
|
34 |
+
"recall_at_3": 0.38227,
|
35 |
+
"recall_at_5": 0.43188
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackGamingRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 931.63,
|
6 |
+
"map_at_1": 0.32759,
|
7 |
+
"map_at_10": 0.43937,
|
8 |
+
"map_at_100": 0.45004,
|
9 |
+
"map_at_1000": 0.4507,
|
10 |
+
"map_at_3": 0.40805,
|
11 |
+
"map_at_5": 0.42497,
|
12 |
+
"mrr_at_1": 0.37367,
|
13 |
+
"mrr_at_10": 0.47237,
|
14 |
+
"mrr_at_100": 0.47973,
|
15 |
+
"mrr_at_1000": 0.48011,
|
16 |
+
"mrr_at_3": 0.4465,
|
17 |
+
"mrr_at_5": 0.46051,
|
18 |
+
"ndcg_at_1": 0.37367,
|
19 |
+
"ndcg_at_10": 0.49659,
|
20 |
+
"ndcg_at_100": 0.54069,
|
21 |
+
"ndcg_at_1000": 0.55552,
|
22 |
+
"ndcg_at_3": 0.44169,
|
23 |
+
"ndcg_at_5": 0.46726,
|
24 |
+
"precision_at_1": 0.37367,
|
25 |
+
"precision_at_10": 0.08163,
|
26 |
+
"precision_at_100": 0.01133,
|
27 |
+
"precision_at_1000": 0.00131,
|
28 |
+
"precision_at_3": 0.19707,
|
29 |
+
"precision_at_5": 0.13718,
|
30 |
+
"recall_at_1": 0.32759,
|
31 |
+
"recall_at_10": 0.63341,
|
32 |
+
"recall_at_100": 0.82502,
|
33 |
+
"recall_at_1000": 0.93259,
|
34 |
+
"recall_at_3": 0.48796,
|
35 |
+
"recall_at_5": 0.54921
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackGisRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1290.88,
|
6 |
+
"map_at_1": 0.18962,
|
7 |
+
"map_at_10": 0.25863,
|
8 |
+
"map_at_100": 0.26818,
|
9 |
+
"map_at_1000": 0.26918,
|
10 |
+
"map_at_3": 0.23043,
|
11 |
+
"map_at_5": 0.24599,
|
12 |
+
"mrr_at_1": 0.20452,
|
13 |
+
"mrr_at_10": 0.27301,
|
14 |
+
"mrr_at_100": 0.28233,
|
15 |
+
"mrr_at_1000": 0.2831,
|
16 |
+
"mrr_at_3": 0.24539,
|
17 |
+
"mrr_at_5": 0.26109,
|
18 |
+
"ndcg_at_1": 0.20452,
|
19 |
+
"ndcg_at_10": 0.30355,
|
20 |
+
"ndcg_at_100": 0.35336,
|
21 |
+
"ndcg_at_1000": 0.37927,
|
22 |
+
"ndcg_at_3": 0.24705,
|
23 |
+
"ndcg_at_5": 0.2742,
|
24 |
+
"precision_at_1": 0.20452,
|
25 |
+
"precision_at_10": 0.04949,
|
26 |
+
"precision_at_100": 0.0078,
|
27 |
+
"precision_at_1000": 0.00104,
|
28 |
+
"precision_at_3": 0.10358,
|
29 |
+
"precision_at_5": 0.07774,
|
30 |
+
"recall_at_1": 0.18962,
|
31 |
+
"recall_at_10": 0.43056,
|
32 |
+
"recall_at_100": 0.66273,
|
33 |
+
"recall_at_1000": 0.8596,
|
34 |
+
"recall_at_3": 0.27776,
|
35 |
+
"recall_at_5": 0.34287
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackMathematicaRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 686.89,
|
6 |
+
"map_at_1": 0.1124,
|
7 |
+
"map_at_10": 0.18503,
|
8 |
+
"map_at_100": 0.19553,
|
9 |
+
"map_at_1000": 0.1969,
|
10 |
+
"map_at_3": 0.1615,
|
11 |
+
"map_at_5": 0.17254,
|
12 |
+
"mrr_at_1": 0.13806,
|
13 |
+
"mrr_at_10": 0.21939,
|
14 |
+
"mrr_at_100": 0.22827,
|
15 |
+
"mrr_at_1000": 0.22911,
|
16 |
+
"mrr_at_3": 0.1932,
|
17 |
+
"mrr_at_5": 0.20558,
|
18 |
+
"ndcg_at_1": 0.13806,
|
19 |
+
"ndcg_at_10": 0.23383,
|
20 |
+
"ndcg_at_100": 0.28834,
|
21 |
+
"ndcg_at_1000": 0.32175,
|
22 |
+
"ndcg_at_3": 0.18652,
|
23 |
+
"ndcg_at_5": 0.20505,
|
24 |
+
"precision_at_1": 0.13806,
|
25 |
+
"precision_at_10": 0.04714,
|
26 |
+
"precision_at_100": 0.00864,
|
27 |
+
"precision_at_1000": 0.0013,
|
28 |
+
"precision_at_3": 0.09328,
|
29 |
+
"precision_at_5": 0.06841,
|
30 |
+
"recall_at_1": 0.1124,
|
31 |
+
"recall_at_10": 0.34854,
|
32 |
+
"recall_at_100": 0.59503,
|
33 |
+
"recall_at_1000": 0.8325,
|
34 |
+
"recall_at_3": 0.2202,
|
35 |
+
"recall_at_5": 0.26715
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackPhysicsRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1269.26,
|
6 |
+
"map_at_1": 0.23012,
|
7 |
+
"map_at_10": 0.33048,
|
8 |
+
"map_at_100": 0.34371,
|
9 |
+
"map_at_1000": 0.34489,
|
10 |
+
"map_at_3": 0.29943,
|
11 |
+
"map_at_5": 0.31602,
|
12 |
+
"mrr_at_1": 0.28104,
|
13 |
+
"mrr_at_10": 0.3799,
|
14 |
+
"mrr_at_100": 0.38836,
|
15 |
+
"mrr_at_1000": 0.38891,
|
16 |
+
"mrr_at_3": 0.35226,
|
17 |
+
"mrr_at_5": 0.36694,
|
18 |
+
"ndcg_at_1": 0.28104,
|
19 |
+
"ndcg_at_10": 0.39037,
|
20 |
+
"ndcg_at_100": 0.44643,
|
21 |
+
"ndcg_at_1000": 0.46939,
|
22 |
+
"ndcg_at_3": 0.33784,
|
23 |
+
"ndcg_at_5": 0.36126,
|
24 |
+
"precision_at_1": 0.28104,
|
25 |
+
"precision_at_10": 0.07267,
|
26 |
+
"precision_at_100": 0.01193,
|
27 |
+
"precision_at_1000": 0.00159,
|
28 |
+
"precision_at_3": 0.16298,
|
29 |
+
"precision_at_5": 0.11684,
|
30 |
+
"recall_at_1": 0.23012,
|
31 |
+
"recall_at_10": 0.52054,
|
32 |
+
"recall_at_100": 0.75622,
|
33 |
+
"recall_at_1000": 0.90675,
|
34 |
+
"recall_at_3": 0.37282,
|
35 |
+
"recall_at_5": 0.43307
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackProgrammersRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1185.95,
|
6 |
+
"map_at_1": 0.21624,
|
7 |
+
"map_at_10": 0.3021,
|
8 |
+
"map_at_100": 0.3152,
|
9 |
+
"map_at_1000": 0.31626,
|
10 |
+
"map_at_3": 0.26951,
|
11 |
+
"map_at_5": 0.28939,
|
12 |
+
"mrr_at_1": 0.26941,
|
13 |
+
"mrr_at_10": 0.3513,
|
14 |
+
"mrr_at_100": 0.3615,
|
15 |
+
"mrr_at_1000": 0.36204,
|
16 |
+
"mrr_at_3": 0.3242,
|
17 |
+
"mrr_at_5": 0.34155,
|
18 |
+
"ndcg_at_1": 0.26941,
|
19 |
+
"ndcg_at_10": 0.35726,
|
20 |
+
"ndcg_at_100": 0.41725,
|
21 |
+
"ndcg_at_1000": 0.44105,
|
22 |
+
"ndcg_at_3": 0.30184,
|
23 |
+
"ndcg_at_5": 0.33176,
|
24 |
+
"precision_at_1": 0.26941,
|
25 |
+
"precision_at_10": 0.06655,
|
26 |
+
"precision_at_100": 0.01152,
|
27 |
+
"precision_at_1000": 0.00152,
|
28 |
+
"precision_at_3": 0.14346,
|
29 |
+
"precision_at_5": 0.10868,
|
30 |
+
"recall_at_1": 0.21624,
|
31 |
+
"recall_at_10": 0.47359,
|
32 |
+
"recall_at_100": 0.73436,
|
33 |
+
"recall_at_1000": 0.89988,
|
34 |
+
"recall_at_3": 0.3234,
|
35 |
+
"recall_at_5": 0.39856
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackRetrieval.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"dataset_version": null, "mteb_version": "0.0.2", "test": {"evaluation_time": 1798.61, "map_at_1": 0.2067566666666667, "map_at_10": 0.28479333333333334, "map_at_100": 0.29612249999999996, "map_at_1000": 0.29731166666666664, "map_at_3": 0.25884, "map_at_5": 0.27298916666666667, "mrr_at_1": 0.24402583333333333, "mrr_at_10": 0.3207041666666667, "mrr_at_100": 0.32958416666666673, "mrr_at_1000": 0.3302541666666666, "mrr_at_3": 0.29677749999999997, "mrr_at_5": 0.3102391666666667, "ndcg_at_1": 0.24402583333333333, "ndcg_at_10": 0.3332616666666667, "ndcg_at_100": 0.38515666666666665, "ndcg_at_1000": 0.4113791666666667, "ndcg_at_3": 0.28687749999999995, "ndcg_at_5": 0.3084766666666667, "precision_at_1": 0.24402583333333333, "precision_at_10": 0.05943749999999999, "precision_at_100": 0.010098333333333334, "precision_at_1000": 0.0014183333333333333, "precision_at_3": 0.132115, "precision_at_5": 0.09548416666666668, "recall_at_1": 0.2067566666666667, "recall_at_10": 0.4424558333333334, "recall_at_100": 0.6731116666666667, "recall_at_1000": 0.8587841666666666, "recall_at_3": 0.3149258333333333, "recall_at_5": 0.3693241666666667}}
|
evaluation/mteb/CQADupstackStatsRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1614.26,
|
6 |
+
"map_at_1": 0.1834,
|
7 |
+
"map_at_10": 0.23988,
|
8 |
+
"map_at_100": 0.24895,
|
9 |
+
"map_at_1000": 0.24992,
|
10 |
+
"map_at_3": 0.21831,
|
11 |
+
"map_at_5": 0.23,
|
12 |
+
"mrr_at_1": 0.20399,
|
13 |
+
"mrr_at_10": 0.26186,
|
14 |
+
"mrr_at_100": 0.27018,
|
15 |
+
"mrr_at_1000": 0.27091,
|
16 |
+
"mrr_at_3": 0.2408,
|
17 |
+
"mrr_at_5": 0.2523,
|
18 |
+
"ndcg_at_1": 0.20399,
|
19 |
+
"ndcg_at_10": 0.27799,
|
20 |
+
"ndcg_at_100": 0.32579,
|
21 |
+
"ndcg_at_1000": 0.35209,
|
22 |
+
"ndcg_at_3": 0.23684,
|
23 |
+
"ndcg_at_5": 0.25521,
|
24 |
+
"precision_at_1": 0.20399,
|
25 |
+
"precision_at_10": 0.04586,
|
26 |
+
"precision_at_100": 0.00755,
|
27 |
+
"precision_at_1000": 0.00105,
|
28 |
+
"precision_at_3": 0.10276,
|
29 |
+
"precision_at_5": 0.07362,
|
30 |
+
"recall_at_1": 0.1834,
|
31 |
+
"recall_at_10": 0.37456,
|
32 |
+
"recall_at_100": 0.5986,
|
33 |
+
"recall_at_1000": 0.79703,
|
34 |
+
"recall_at_3": 0.26164,
|
35 |
+
"recall_at_5": 0.30652
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackTexRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 2711.63,
|
6 |
+
"map_at_1": 0.12327,
|
7 |
+
"map_at_10": 0.17572,
|
8 |
+
"map_at_100": 0.18534,
|
9 |
+
"map_at_1000": 0.18653,
|
10 |
+
"map_at_3": 0.15703,
|
11 |
+
"map_at_5": 0.16752,
|
12 |
+
"mrr_at_1": 0.15038,
|
13 |
+
"mrr_at_10": 0.20726,
|
14 |
+
"mrr_at_100": 0.2161,
|
15 |
+
"mrr_at_1000": 0.21695,
|
16 |
+
"mrr_at_3": 0.18829,
|
17 |
+
"mrr_at_5": 0.19885,
|
18 |
+
"ndcg_at_1": 0.15038,
|
19 |
+
"ndcg_at_10": 0.21241,
|
20 |
+
"ndcg_at_100": 0.26179,
|
21 |
+
"ndcg_at_1000": 0.29316,
|
22 |
+
"ndcg_at_3": 0.17762,
|
23 |
+
"ndcg_at_5": 0.19413,
|
24 |
+
"precision_at_1": 0.15038,
|
25 |
+
"precision_at_10": 0.03892,
|
26 |
+
"precision_at_100": 0.0075,
|
27 |
+
"precision_at_1000": 0.00118,
|
28 |
+
"precision_at_3": 0.08351,
|
29 |
+
"precision_at_5": 0.06187,
|
30 |
+
"recall_at_1": 0.12327,
|
31 |
+
"recall_at_10": 0.29342,
|
32 |
+
"recall_at_100": 0.51854,
|
33 |
+
"recall_at_1000": 0.74648,
|
34 |
+
"recall_at_3": 0.19596,
|
35 |
+
"recall_at_5": 0.23899
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackUnixRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1688.62,
|
6 |
+
"map_at_1": 0.20594,
|
7 |
+
"map_at_10": 0.27879,
|
8 |
+
"map_at_100": 0.28926,
|
9 |
+
"map_at_1000": 0.29041,
|
10 |
+
"map_at_3": 0.25669,
|
11 |
+
"map_at_5": 0.26774,
|
12 |
+
"mrr_at_1": 0.23694,
|
13 |
+
"mrr_at_10": 0.31335,
|
14 |
+
"mrr_at_100": 0.32218,
|
15 |
+
"mrr_at_1000": 0.32298,
|
16 |
+
"mrr_at_3": 0.2926,
|
17 |
+
"mrr_at_5": 0.30328,
|
18 |
+
"ndcg_at_1": 0.23694,
|
19 |
+
"ndcg_at_10": 0.32456,
|
20 |
+
"ndcg_at_100": 0.37667,
|
21 |
+
"ndcg_at_1000": 0.40571,
|
22 |
+
"ndcg_at_3": 0.28283,
|
23 |
+
"ndcg_at_5": 0.29986,
|
24 |
+
"precision_at_1": 0.23694,
|
25 |
+
"precision_at_10": 0.05448,
|
26 |
+
"precision_at_100": 0.00912,
|
27 |
+
"precision_at_1000": 0.00127,
|
28 |
+
"precision_at_3": 0.12718,
|
29 |
+
"precision_at_5": 0.08843,
|
30 |
+
"recall_at_1": 0.20594,
|
31 |
+
"recall_at_10": 0.43005,
|
32 |
+
"recall_at_100": 0.66228,
|
33 |
+
"recall_at_1000": 0.87171,
|
34 |
+
"recall_at_3": 0.31554,
|
35 |
+
"recall_at_5": 0.35838
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackWebmastersRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 540.56,
|
6 |
+
"map_at_1": 0.20856,
|
7 |
+
"map_at_10": 0.28372,
|
8 |
+
"map_at_100": 0.2987,
|
9 |
+
"map_at_1000": 0.30075,
|
10 |
+
"map_at_3": 0.26054,
|
11 |
+
"map_at_5": 0.27129,
|
12 |
+
"mrr_at_1": 0.25494,
|
13 |
+
"mrr_at_10": 0.32735,
|
14 |
+
"mrr_at_100": 0.33794,
|
15 |
+
"mrr_at_1000": 0.3385,
|
16 |
+
"mrr_at_3": 0.30731,
|
17 |
+
"mrr_at_5": 0.31897,
|
18 |
+
"ndcg_at_1": 0.25494,
|
19 |
+
"ndcg_at_10": 0.33385,
|
20 |
+
"ndcg_at_100": 0.39436,
|
21 |
+
"ndcg_at_1000": 0.42313,
|
22 |
+
"ndcg_at_3": 0.29612,
|
23 |
+
"ndcg_at_5": 0.31187,
|
24 |
+
"precision_at_1": 0.25494,
|
25 |
+
"precision_at_10": 0.06423,
|
26 |
+
"precision_at_100": 0.01383,
|
27 |
+
"precision_at_1000": 0.00224,
|
28 |
+
"precision_at_3": 0.13834,
|
29 |
+
"precision_at_5": 0.1,
|
30 |
+
"recall_at_1": 0.20856,
|
31 |
+
"recall_at_10": 0.42678,
|
32 |
+
"recall_at_100": 0.70224,
|
33 |
+
"recall_at_1000": 0.89369,
|
34 |
+
"recall_at_3": 0.31957,
|
35 |
+
"recall_at_5": 0.36026
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackWordpressRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1798.61,
|
6 |
+
"map_at_1": 0.16519,
|
7 |
+
"map_at_10": 0.2215,
|
8 |
+
"map_at_100": 0.23181,
|
9 |
+
"map_at_1000": 0.23292,
|
10 |
+
"map_at_3": 0.20132,
|
11 |
+
"map_at_5": 0.21346,
|
12 |
+
"mrr_at_1": 0.1793,
|
13 |
+
"mrr_at_10": 0.23506,
|
14 |
+
"mrr_at_100": 0.24581,
|
15 |
+
"mrr_at_1000": 0.24675,
|
16 |
+
"mrr_at_3": 0.21503,
|
17 |
+
"mrr_at_5": 0.22686,
|
18 |
+
"ndcg_at_1": 0.1793,
|
19 |
+
"ndcg_at_10": 0.25636,
|
20 |
+
"ndcg_at_100": 0.30736,
|
21 |
+
"ndcg_at_1000": 0.33841,
|
22 |
+
"ndcg_at_3": 0.21546,
|
23 |
+
"ndcg_at_5": 0.23658,
|
24 |
+
"precision_at_1": 0.1793,
|
25 |
+
"precision_at_10": 0.03993,
|
26 |
+
"precision_at_100": 0.00689,
|
27 |
+
"precision_at_1000": 0.00104,
|
28 |
+
"precision_at_3": 0.09057,
|
29 |
+
"precision_at_5": 0.0658,
|
30 |
+
"recall_at_1": 0.16519,
|
31 |
+
"recall_at_10": 0.35268,
|
32 |
+
"recall_at_100": 0.5817,
|
33 |
+
"recall_at_1000": 0.81668,
|
34 |
+
"recall_at_3": 0.24165,
|
35 |
+
"recall_at_5": 0.29254
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/ClimateFEVER.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 16391.42,
|
6 |
+
"map_at_1": 0.10363,
|
7 |
+
"map_at_10": 0.18301,
|
8 |
+
"map_at_100": 0.20019,
|
9 |
+
"map_at_1000": 0.20207,
|
10 |
+
"map_at_3": 0.14877,
|
11 |
+
"map_at_5": 0.16544,
|
12 |
+
"mrr_at_1": 0.22866,
|
13 |
+
"mrr_at_10": 0.34935,
|
14 |
+
"mrr_at_100": 0.35802,
|
15 |
+
"mrr_at_1000": 0.3584,
|
16 |
+
"mrr_at_3": 0.30966,
|
17 |
+
"mrr_at_5": 0.33204,
|
18 |
+
"ndcg_at_1": 0.22866,
|
19 |
+
"ndcg_at_10": 0.26595,
|
20 |
+
"ndcg_at_100": 0.33514,
|
21 |
+
"ndcg_at_1000": 0.36872,
|
22 |
+
"ndcg_at_3": 0.20667,
|
23 |
+
"ndcg_at_5": 0.22728,
|
24 |
+
"precision_at_1": 0.22866,
|
25 |
+
"precision_at_10": 0.08632,
|
26 |
+
"precision_at_100": 0.01612,
|
27 |
+
"precision_at_1000": 0.00224,
|
28 |
+
"precision_at_3": 0.15505,
|
29 |
+
"precision_at_5": 0.12404,
|
30 |
+
"recall_at_1": 0.10363,
|
31 |
+
"recall_at_10": 0.33494,
|
32 |
+
"recall_at_100": 0.57593,
|
33 |
+
"recall_at_1000": 0.76342,
|
34 |
+
"recall_at_3": 0.19157,
|
35 |
+
"recall_at_5": 0.24638
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/DBPedia.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 11184.99,
|
6 |
+
"map_at_1": 0.07436,
|
7 |
+
"map_at_10": 0.1476,
|
8 |
+
"map_at_100": 0.19206,
|
9 |
+
"map_at_1000": 0.20267,
|
10 |
+
"map_at_3": 0.10894,
|
11 |
+
"map_at_5": 0.12829,
|
12 |
+
"mrr_at_1": 0.5425,
|
13 |
+
"mrr_at_10": 0.63769,
|
14 |
+
"mrr_at_100": 0.64193,
|
15 |
+
"mrr_at_1000": 0.64211,
|
16 |
+
"mrr_at_3": 0.61458,
|
17 |
+
"mrr_at_5": 0.63096,
|
18 |
+
"ndcg_at_1": 0.42875,
|
19 |
+
"ndcg_at_10": 0.31507,
|
20 |
+
"ndcg_at_100": 0.34559,
|
21 |
+
"ndcg_at_1000": 0.41246,
|
22 |
+
"ndcg_at_3": 0.35058,
|
23 |
+
"ndcg_at_5": 0.33396,
|
24 |
+
"precision_at_1": 0.5425,
|
25 |
+
"precision_at_10": 0.2445,
|
26 |
+
"precision_at_100": 0.07383,
|
27 |
+
"precision_at_1000": 0.01582,
|
28 |
+
"precision_at_3": 0.38083,
|
29 |
+
"precision_at_5": 0.326,
|
30 |
+
"recall_at_1": 0.07436,
|
31 |
+
"recall_at_10": 0.19862,
|
32 |
+
"recall_at_100": 0.38981,
|
33 |
+
"recall_at_1000": 0.61038,
|
34 |
+
"recall_at_3": 0.11949,
|
35 |
+
"recall_at_5": 0.15562
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/EmotionClassification.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.46390000000000003,
|
6 |
+
"accuracy_stderr": 0.018785366645343925,
|
7 |
+
"evaluation_time": 31.09,
|
8 |
+
"f1": 0.42264248858567033,
|
9 |
+
"f1_stderr": 0.011565342464001555,
|
10 |
+
"main_score": 0.46390000000000003
|
11 |
+
}
|
12 |
+
}
|
evaluation/mteb/FEVER.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 17506.78,
|
6 |
+
"map_at_1": 0.50916,
|
7 |
+
"map_at_10": 0.62258,
|
8 |
+
"map_at_100": 0.62741,
|
9 |
+
"map_at_1000": 0.62763,
|
10 |
+
"map_at_3": 0.60018,
|
11 |
+
"map_at_5": 0.6142,
|
12 |
+
"mrr_at_1": 0.54965,
|
13 |
+
"mrr_at_10": 0.66554,
|
14 |
+
"mrr_at_100": 0.66966,
|
15 |
+
"mrr_at_1000": 0.66978,
|
16 |
+
"mrr_at_3": 0.64414,
|
17 |
+
"mrr_at_5": 0.6577,
|
18 |
+
"ndcg_at_1": 0.54965,
|
19 |
+
"ndcg_at_10": 0.6812,
|
20 |
+
"ndcg_at_100": 0.70282,
|
21 |
+
"ndcg_at_1000": 0.70788,
|
22 |
+
"ndcg_at_3": 0.63862,
|
23 |
+
"ndcg_at_5": 0.66216,
|
24 |
+
"precision_at_1": 0.54965,
|
25 |
+
"precision_at_10": 0.08998,
|
26 |
+
"precision_at_100": 0.01016,
|
27 |
+
"precision_at_1000": 0.00107,
|
28 |
+
"precision_at_3": 0.25618,
|
29 |
+
"precision_at_5": 0.16676,
|
30 |
+
"recall_at_1": 0.50916,
|
31 |
+
"recall_at_10": 0.8204,
|
32 |
+
"recall_at_100": 0.91689,
|
33 |
+
"recall_at_1000": 0.95349,
|
34 |
+
"recall_at_3": 0.70512,
|
35 |
+
"recall_at_5": 0.76299
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/FiQA2018.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 310.86,
|
6 |
+
"map_at_1": 0.13568,
|
7 |
+
"map_at_10": 0.23264,
|
8 |
+
"map_at_100": 0.24824,
|
9 |
+
"map_at_1000": 0.25014,
|
10 |
+
"map_at_3": 0.19724,
|
11 |
+
"map_at_5": 0.21772,
|
12 |
+
"mrr_at_1": 0.27315,
|
13 |
+
"mrr_at_10": 0.35935,
|
14 |
+
"mrr_at_100": 0.36929,
|
15 |
+
"mrr_at_1000": 0.36985,
|
16 |
+
"mrr_at_3": 0.33591,
|
17 |
+
"mrr_at_5": 0.34848,
|
18 |
+
"ndcg_at_1": 0.27315,
|
19 |
+
"ndcg_at_10": 0.29988,
|
20 |
+
"ndcg_at_100": 0.3641,
|
21 |
+
"ndcg_at_1000": 0.40185,
|
22 |
+
"ndcg_at_3": 0.26342,
|
23 |
+
"ndcg_at_5": 0.2768,
|
24 |
+
"precision_at_1": 0.27315,
|
25 |
+
"precision_at_10": 0.08565,
|
26 |
+
"precision_at_100": 0.01508,
|
27 |
+
"precision_at_1000": 0.00219,
|
28 |
+
"precision_at_3": 0.1785,
|
29 |
+
"precision_at_5": 0.13673,
|
30 |
+
"recall_at_1": 0.13568,
|
31 |
+
"recall_at_10": 0.37133,
|
32 |
+
"recall_at_100": 0.61475,
|
33 |
+
"recall_at_1000": 0.84372,
|
34 |
+
"recall_at_3": 0.24112,
|
35 |
+
"recall_at_5": 0.29507
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/HotpotQA.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 13678.13,
|
6 |
+
"map_at_1": 0.30878,
|
7 |
+
"map_at_10": 0.40868,
|
8 |
+
"map_at_100": 0.41694,
|
9 |
+
"map_at_1000": 0.41775,
|
10 |
+
"map_at_3": 0.3856,
|
11 |
+
"map_at_5": 0.39947,
|
12 |
+
"mrr_at_1": 0.61756,
|
13 |
+
"mrr_at_10": 0.68265,
|
14 |
+
"mrr_at_100": 0.68671,
|
15 |
+
"mrr_at_1000": 0.68694,
|
16 |
+
"mrr_at_3": 0.66784,
|
17 |
+
"mrr_at_5": 0.67704,
|
18 |
+
"ndcg_at_1": 0.61756,
|
19 |
+
"ndcg_at_10": 0.49931,
|
20 |
+
"ndcg_at_100": 0.53179,
|
21 |
+
"ndcg_at_1000": 0.54948,
|
22 |
+
"ndcg_at_3": 0.46103,
|
23 |
+
"ndcg_at_5": 0.48147,
|
24 |
+
"precision_at_1": 0.61756,
|
25 |
+
"precision_at_10": 0.10163,
|
26 |
+
"precision_at_100": 0.01271,
|
27 |
+
"precision_at_1000": 0.00151,
|
28 |
+
"precision_at_3": 0.28179,
|
29 |
+
"precision_at_5": 0.18528,
|
30 |
+
"recall_at_1": 0.30878,
|
31 |
+
"recall_at_10": 0.50817,
|
32 |
+
"recall_at_100": 0.63545,
|
33 |
+
"recall_at_1000": 0.75361,
|
34 |
+
"recall_at_3": 0.42269,
|
35 |
+
"recall_at_5": 0.4632
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/ImdbClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.6404799999999999,
|
6 |
+
"accuracy_stderr": 0.03197141223030349,
|
7 |
+
"ap": 0.5918525145533928,
|
8 |
+
"ap_stderr": 0.024531019346391677,
|
9 |
+
"evaluation_time": 915.58,
|
10 |
+
"f1": 0.6394712318134925,
|
11 |
+
"f1_stderr": 0.0317267000377415,
|
12 |
+
"main_score": 0.6404799999999999
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MSMARCO.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"validation": {
|
5 |
+
"evaluation_time": 22861.03,
|
6 |
+
"map_at_1": 0.189,
|
7 |
+
"map_at_10": 0.29748,
|
8 |
+
"map_at_100": 0.30976,
|
9 |
+
"map_at_1000": 0.31041,
|
10 |
+
"map_at_3": 0.26113,
|
11 |
+
"map_at_5": 0.28197,
|
12 |
+
"mrr_at_1": 0.19413,
|
13 |
+
"mrr_at_10": 0.30322,
|
14 |
+
"mrr_at_100": 0.31497,
|
15 |
+
"mrr_at_1000": 0.31555,
|
16 |
+
"mrr_at_3": 0.26729,
|
17 |
+
"mrr_at_5": 0.28789,
|
18 |
+
"ndcg_at_1": 0.19413,
|
19 |
+
"ndcg_at_10": 0.36048,
|
20 |
+
"ndcg_at_100": 0.42152,
|
21 |
+
"ndcg_at_1000": 0.43772,
|
22 |
+
"ndcg_at_3": 0.28642,
|
23 |
+
"ndcg_at_5": 0.32358,
|
24 |
+
"precision_at_1": 0.19413,
|
25 |
+
"precision_at_10": 0.05785,
|
26 |
+
"precision_at_100": 0.00887,
|
27 |
+
"precision_at_1000": 0.00103,
|
28 |
+
"precision_at_3": 0.12192,
|
29 |
+
"precision_at_5": 0.09189,
|
30 |
+
"recall_at_1": 0.189,
|
31 |
+
"recall_at_10": 0.55457,
|
32 |
+
"recall_at_100": 0.84091,
|
33 |
+
"recall_at_1000": 0.96482,
|
34 |
+
"recall_at_3": 0.35359,
|
35 |
+
"recall_at_5": 0.44275
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/MTOPDomainClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.9207706338349293,
|
7 |
+
"accuracy_stderr": 0.005541106237593856,
|
8 |
+
"f1": 0.9156680443236652,
|
9 |
+
"f1_stderr": 0.005216941657420623,
|
10 |
+
"main_score": 0.9207706338349293
|
11 |
+
},
|
12 |
+
"evaluation_time": 31.37
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MTOPIntentClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.7118559051527589,
|
7 |
+
"accuracy_stderr": 0.012419016906278644,
|
8 |
+
"f1": 0.5242887061726789,
|
9 |
+
"f1_stderr": 0.011199354119349208,
|
10 |
+
"main_score": 0.7118559051527589
|
11 |
+
},
|
12 |
+
"evaluation_time": 82.02
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MassiveIntentClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.6864828513786148,
|
7 |
+
"accuracy_stderr": 0.012244395475104431,
|
8 |
+
"f1": 0.6654281381596097,
|
9 |
+
"f1_stderr": 0.009337695311493243,
|
10 |
+
"main_score": 0.6864828513786148
|
11 |
+
},
|
12 |
+
"evaluation_time": 49.93
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MassiveScenarioClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.7604236718224613,
|
7 |
+
"accuracy_stderr": 0.009702648067132833,
|
8 |
+
"f1": 0.7589170458655639,
|
9 |
+
"f1_stderr": 0.009666037600064457,
|
10 |
+
"main_score": 0.7604236718224613
|
11 |
+
},
|
12 |
+
"evaluation_time": 29.65
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MedrxivClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1694.42,
|
6 |
+
"v_measure": 0.320840369055247,
|
7 |
+
"v_measure_std": 0.012975340075124157
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/MedrxivClusteringS2S.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 258.59,
|
6 |
+
"v_measure": 0.29448729560244535,
|
7 |
+
"v_measure_std": 0.014610308837145732
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/MindSmallReranking.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 18115.54,
|
6 |
+
"map": 0.31340856463122374,
|
7 |
+
"mrr": 0.32398547669840916
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/NFCorpus.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 101.25,
|
6 |
+
"map_at_1": 0.05526,
|
7 |
+
"map_at_10": 0.11745,
|
8 |
+
"map_at_100": 0.14831,
|
9 |
+
"map_at_1000": 0.16235,
|
10 |
+
"map_at_3": 0.08716,
|
11 |
+
"map_at_5": 0.10101,
|
12 |
+
"mrr_at_1": 0.43653,
|
13 |
+
"mrr_at_10": 0.51067,
|
14 |
+
"mrr_at_100": 0.51881,
|
15 |
+
"mrr_at_1000": 0.51912,
|
16 |
+
"mrr_at_3": 0.4902,
|
17 |
+
"mrr_at_5": 0.50289,
|
18 |
+
"ndcg_at_1": 0.4195,
|
19 |
+
"ndcg_at_10": 0.32083,
|
20 |
+
"ndcg_at_100": 0.3005,
|
21 |
+
"ndcg_at_1000": 0.38661,
|
22 |
+
"ndcg_at_3": 0.3794,
|
23 |
+
"ndcg_at_5": 0.35456,
|
24 |
+
"precision_at_1": 0.43344,
|
25 |
+
"precision_at_10": 0.23437,
|
26 |
+
"precision_at_100": 0.0783,
|
27 |
+
"precision_at_1000": 0.02053,
|
28 |
+
"precision_at_3": 0.35501,
|
29 |
+
"precision_at_5": 0.30464,
|
30 |
+
"recall_at_1": 0.05526,
|
31 |
+
"recall_at_10": 0.15446,
|
32 |
+
"recall_at_100": 0.31179,
|
33 |
+
"recall_at_1000": 0.61578,
|
34 |
+
"recall_at_3": 0.0971,
|
35 |
+
"recall_at_5": 0.12026
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/NQ.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 8091.11,
|
6 |
+
"map_at_1": 0.23467,
|
7 |
+
"map_at_10": 0.36041,
|
8 |
+
"map_at_100": 0.37268,
|
9 |
+
"map_at_1000": 0.37322,
|
10 |
+
"map_at_3": 0.3209,
|
11 |
+
"map_at_5": 0.34414,
|
12 |
+
"mrr_at_1": 0.26738,
|
13 |
+
"mrr_at_10": 0.38665,
|
14 |
+
"mrr_at_100": 0.3964,
|
15 |
+
"mrr_at_1000": 0.39681,
|
16 |
+
"mrr_at_3": 0.35207,
|
17 |
+
"mrr_at_5": 0.3731,
|
18 |
+
"ndcg_at_1": 0.26709,
|
19 |
+
"ndcg_at_10": 0.42942,
|
20 |
+
"ndcg_at_100": 0.48296,
|
21 |
+
"ndcg_at_1000": 0.49651,
|
22 |
+
"ndcg_at_3": 0.35413,
|
23 |
+
"ndcg_at_5": 0.39368,
|
24 |
+
"precision_at_1": 0.26709,
|
25 |
+
"precision_at_10": 0.07306,
|
26 |
+
"precision_at_100": 0.01029,
|
27 |
+
"precision_at_1000": 0.00116,
|
28 |
+
"precision_at_3": 0.16348,
|
29 |
+
"precision_at_5": 0.12068,
|
30 |
+
"recall_at_1": 0.23467,
|
31 |
+
"recall_at_10": 0.61493,
|
32 |
+
"recall_at_100": 0.85011,
|
33 |
+
"recall_at_1000": 0.95261,
|
34 |
+
"recall_at_3": 0.41952,
|
35 |
+
"recall_at_5": 0.51106
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/QuoraRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 742.32,
|
6 |
+
"map_at_1": 0.67517,
|
7 |
+
"map_at_10": 0.81054,
|
8 |
+
"map_at_100": 0.81727,
|
9 |
+
"map_at_1000": 0.81752,
|
10 |
+
"map_at_3": 0.78018,
|
11 |
+
"map_at_5": 0.79879,
|
12 |
+
"mrr_at_1": 0.7752,
|
13 |
+
"mrr_at_10": 0.84429,
|
14 |
+
"mrr_at_100": 0.84582,
|
15 |
+
"mrr_at_1000": 0.84584,
|
16 |
+
"mrr_at_3": 0.83268,
|
17 |
+
"mrr_at_5": 0.84013,
|
18 |
+
"ndcg_at_1": 0.7753,
|
19 |
+
"ndcg_at_10": 0.85277,
|
20 |
+
"ndcg_at_100": 0.86805,
|
21 |
+
"ndcg_at_1000": 0.8701,
|
22 |
+
"ndcg_at_3": 0.81975,
|
23 |
+
"ndcg_at_5": 0.83723,
|
24 |
+
"precision_at_1": 0.7753,
|
25 |
+
"precision_at_10": 0.12961,
|
26 |
+
"precision_at_100": 0.01502,
|
27 |
+
"precision_at_1000": 0.00156,
|
28 |
+
"precision_at_3": 0.35713,
|
29 |
+
"precision_at_5": 0.23574,
|
30 |
+
"recall_at_1": 0.67517,
|
31 |
+
"recall_at_10": 0.93486,
|
32 |
+
"recall_at_100": 0.989,
|
33 |
+
"recall_at_1000": 0.9993,
|
34 |
+
"recall_at_3": 0.8418,
|
35 |
+
"recall_at_5": 0.88975
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/RedditClustering.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3324.44,
|
6 |
+
"v_measure": 0.48225994608749917,
|
7 |
+
"v_measure_std": 0.055941572162319216
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/RedditClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 13390.64,
|
6 |
+
"v_measure": 0.5317635557157765,
|
7 |
+
"v_measure_std": 0.12570620726605897
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/SCIDOCS.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 214.39,
|
6 |
+
"map_at_1": 0.03988,
|
7 |
+
"map_at_10": 0.094,
|
8 |
+
"map_at_100": 0.10968,
|
9 |
+
"map_at_1000": 0.11257,
|
10 |
+
"map_at_3": 0.07123,
|
11 |
+
"map_at_5": 0.08221,
|
12 |
+
"mrr_at_1": 0.197,
|
13 |
+
"mrr_at_10": 0.29098,
|
14 |
+
"mrr_at_100": 0.30247,
|
15 |
+
"mrr_at_1000": 0.30318,
|
16 |
+
"mrr_at_3": 0.2655,
|
17 |
+
"mrr_at_5": 0.27915,
|
18 |
+
"ndcg_at_1": 0.197,
|
19 |
+
"ndcg_at_10": 0.16176,
|
20 |
+
"ndcg_at_100": 0.22931,
|
21 |
+
"ndcg_at_1000": 0.28301,
|
22 |
+
"ndcg_at_3": 0.16142,
|
23 |
+
"ndcg_at_5": 0.13634,
|
24 |
+
"precision_at_1": 0.197,
|
25 |
+
"precision_at_10": 0.0818,
|
26 |
+
"precision_at_100": 0.01801,
|
27 |
+
"precision_at_1000": 0.00309,
|
28 |
+
"precision_at_3": 0.151,
|
29 |
+
"precision_at_5": 0.1174,
|
30 |
+
"recall_at_1": 0.03988,
|
31 |
+
"recall_at_10": 0.16625,
|
32 |
+
"recall_at_100": 0.3661,
|
33 |
+
"recall_at_1000": 0.62805,
|
34 |
+
"recall_at_3": 0.09168,
|
35 |
+
"recall_at_5": 0.11902
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/SGPT-1.3B-weightedmean-msmarco-specb-bitfit_results.csv
ADDED
@@ -0,0 +1,355 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model,task,dataset,language,metric,value
|
2 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,BitextMining,BUCC,,f1,
|
3 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,BitextMining,Tatoeba,,f1,
|
4 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en,accuracy,0.652089552238806
|
5 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
|
6 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
|
7 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
|
8 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
|
9 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
|
10 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
|
11 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonPolarityClassification,en,accuracy,0.7320565
|
12 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,en,accuracy,0.34956
|
13 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
|
14 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
|
15 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
|
16 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
|
17 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
|
18 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
|
19 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
|
20 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
|
21 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
|
22 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
|
23 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,Banking77Classification,en,accuracy,0.8205844155844156
|
24 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,EmotionClassification,en,accuracy,0.46390000000000003
|
25 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,ImdbClassification,en,accuracy,0.6404799999999999
|
26 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
|
27 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
|
28 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
|
29 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
|
30 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
|
31 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
|
32 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
|
33 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
|
34 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
|
35 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
|
36 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
|
37 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
|
38 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
|
39 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
|
40 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
|
41 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
|
42 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
|
43 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
|
44 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,en,accuracy,0.6864828513786148
|
45 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
|
46 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
|
47 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
|
48 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
|
49 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
|
50 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
|
51 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
|
52 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
|
53 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
|
54 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
|
55 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
|
56 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
|
57 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
|
58 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
|
59 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
|
60 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
|
61 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
|
62 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
|
63 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
|
64 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
|
65 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
|
66 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
|
67 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
|
68 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
|
69 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
|
70 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
|
71 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
|
72 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
|
73 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
|
74 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
|
75 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
|
76 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
|
77 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
|
78 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
|
79 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
|
80 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
|
81 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
|
82 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
|
83 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
|
84 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
|
85 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
|
86 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
|
87 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
|
88 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
|
89 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
|
90 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
|
91 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
|
92 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
|
93 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
|
94 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
|
95 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
|
96 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
|
97 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
|
98 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
|
99 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
|
100 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
|
101 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
|
102 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
|
103 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
|
104 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
|
105 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
|
106 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
|
107 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
|
108 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
|
109 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
|
110 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
|
111 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
|
112 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
|
113 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
|
114 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
|
115 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
|
116 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
|
117 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
|
118 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
|
119 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
|
120 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
|
121 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
|
122 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
|
123 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
|
124 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
|
125 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
|
126 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
|
127 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
|
128 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
|
129 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
|
130 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
|
131 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
|
132 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
|
133 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
|
134 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
|
135 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
|
136 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
|
137 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
|
138 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
|
139 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
|
140 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
|
141 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
|
142 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
|
143 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
|
144 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
|
145 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,en,accuracy,0.7604236718224613
|
146 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
|
147 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
|
148 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
|
149 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
|
150 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
|
151 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
|
152 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
|
153 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
|
154 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
|
155 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
|
156 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
|
157 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
|
158 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
|
159 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
|
160 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
|
161 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
|
162 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
|
163 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
|
164 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
|
165 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
|
166 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
|
167 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
|
168 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
|
169 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
|
170 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
|
171 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
|
172 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
|
173 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
|
174 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
|
175 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
|
176 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
|
177 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
|
178 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
|
179 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
|
180 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
|
181 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
|
182 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
|
183 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
|
184 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
|
185 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
|
186 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
|
187 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
|
188 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
|
189 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
|
190 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
|
191 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
|
192 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
|
193 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
|
194 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
|
195 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
|
196 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
|
197 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
|
198 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
|
199 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
|
200 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
|
201 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
|
202 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
|
203 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
|
204 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
|
205 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
|
206 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
|
207 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
|
208 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
|
209 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
|
210 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
|
211 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
|
212 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
|
213 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
|
214 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
|
215 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
|
216 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
|
217 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
|
218 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
|
219 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
|
220 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
|
221 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
|
222 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
|
223 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
|
224 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
|
225 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
|
226 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
|
227 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
|
228 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,en,accuracy,0.9207706338349293
|
229 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
|
230 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
|
231 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
|
232 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
|
233 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
|
234 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
|
235 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
|
236 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
|
237 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
|
238 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
|
239 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,en,accuracy,0.7118559051527589
|
240 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
|
241 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
|
242 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
|
243 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
|
244 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
|
245 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
|
246 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
|
247 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
|
248 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
|
249 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
|
250 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,ToxicConversationsClassification,en,accuracy,0.687272
|
251 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,TweetSentimentExtractionClassification,en,accuracy,0.556677985285795
|
252 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringP2P,en,v_measure,0.4338419491695377
|
253 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringS2S,en,v_measure,0.3370962633433912
|
254 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringP2P,en,v_measure,0.3505918333141837
|
255 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringS2S,en,v_measure,0.3071055028830579
|
256 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringP2P,en,v_measure,0.320840369055247
|
257 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringS2S,en,v_measure,0.29448729560244535
|
258 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClustering,en,v_measure,0.48225994608749917
|
259 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClusteringP2P,en,v_measure,0.5317635557157765
|
260 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClustering,en,v_measure,0.6085593925770172
|
261 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClusteringP2P,en,v_measure,0.323567729982375
|
262 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,TwentyNewsgroupsClustering,en,v_measure,0.4005809562275603
|
263 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,SprintDuplicateQuestions,en,ap,0.9257836032673468
|
264 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterSemEval2015,en,ap,0.6237052608803734
|
265 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterURLCorpus,en,ap,0.8378748636891035
|
266 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,AskUbuntuDupQuestions,en,map,0.5813305899687008
|
267 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,MindSmallReranking,en,map,0.31340856463122374
|
268 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,SciDocsRR,en,map,0.7721233007730808
|
269 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,StackOverflowDupQuestions,en,map,0.49320607035290737
|
270 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,ArguAna,en,ndcg_at_10,0.4968
|
271 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,ClimateFEVER,en,ndcg_at_10,0.26595
|
272 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,CQADupstackRetrieval,en,ndcg_at_10,0.3332616666666667
|
273 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,DBPedia,en,ndcg_at_10,0.31507
|
274 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,FEVER,en,ndcg_at_10,0.6812
|
275 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,FiQA2018,en,ndcg_at_10,0.29988
|
276 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,HotpotQA,en,ndcg_at_10,0.49931
|
277 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,MSMARCO,en,ndcg_at_10,0.36048
|
278 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,NFCorpus,en,ndcg_at_10,0.32083
|
279 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,NQ,en,ndcg_at_10,0.42942
|
280 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,QuoraRetrieval,en,ndcg_at_10,0.85277
|
281 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,SCIDOCS,en,ndcg_at_10,0.16176
|
282 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,SciFact,en,ndcg_at_10,0.68287
|
283 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,Touche2020,en,ndcg_at_10,0.2445
|
284 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,TRECCOVID,en,ndcg_at_10,0.7298
|
285 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,BIOSSES,en,cosine_spearman,0.8301514456843275
|
286 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,SICK-R,en,cosine_spearman,0.6722953551111448
|
287 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS12,en,cosine_spearman,0.6659241013465915
|
288 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS13,en,cosine_spearman,0.7733151317062642
|
289 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS14,en,cosine_spearman,0.7182815265534886
|
290 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS15,en,cosine_spearman,0.8065931167868883
|
291 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS16,en,cosine_spearman,0.7891151365939403
|
292 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
|
293 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
|
294 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
|
295 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
|
296 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
|
297 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
|
298 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
|
299 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
|
300 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-en,cosine_spearman,0.8698674844768606
|
301 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
|
302 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
|
303 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
|
304 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
|
305 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
|
306 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
|
307 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
|
308 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
|
309 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
|
310 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
|
311 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
|
312 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
|
313 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,en,cosine_spearman,0.6730387805090023
|
314 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
|
315 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
|
316 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
|
317 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
|
318 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
|
319 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
|
320 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
|
321 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
|
322 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
|
323 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
|
324 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
|
325 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
|
326 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
|
327 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
|
328 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
|
329 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
|
330 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
|
331 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
|
332 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
|
333 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
|
334 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
|
335 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
|
336 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
|
337 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
|
338 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
|
339 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
|
340 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
|
341 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
|
342 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
|
343 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
|
344 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
|
345 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
|
346 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
|
347 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
|
348 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STSBenchmark,en,cosine_spearman,0.775887175717799
|
349 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Summarization,SummEval,en,cosine_spearman,0.25440272876996695
|
350 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,average,en,accuracy,0.6651794596081484
|
351 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,average,en,v_measure,0.3991540721780082
|
352 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,average,en,ap,0.7957879092789413
|
353 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,average,en,map,0.5400171314314782
|
354 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,average,en,ndcg_at_10,0.4449267777777778
|
355 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,average,en,cosine_spearman,0.7574469254486307
|
evaluation/mteb/SICK-R.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7729330379162072,
|
7 |
+
"spearman": 0.6722953551111448
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.7144682700059415,
|
11 |
+
"spearman": 0.6633178012153248
|
12 |
+
},
|
13 |
+
"evaluation_time": 52.38,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7146941734657887,
|
16 |
+
"spearman": 0.6643234359835815
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/STS12.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7540943196466576,
|
7 |
+
"spearman": 0.6659241013465915
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.7132500540796616,
|
11 |
+
"spearman": 0.6786667467202591
|
12 |
+
},
|
13 |
+
"evaluation_time": 26.18,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7148209832089134,
|
16 |
+
"spearman": 0.6794511626964879
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/STS13.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7708302398877518,
|
7 |
+
"spearman": 0.7733151317062642
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.7677020279715008,
|
11 |
+
"spearman": 0.7713893776083225
|
12 |
+
},
|
13 |
+
"evaluation_time": 12.09,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7676732290707478,
|
16 |
+
"spearman": 0.7714500877396631
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|