Commit
·
5d4e702
1
Parent(s):
7853d0d
Add MTEB evaluation
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- {eval → evaluation/beir}/beir.json +0 -0
- evaluation/mteb/AmazonCounterfactualClassification.json +16 -0
- evaluation/mteb/AmazonPolarityClassification.json +14 -0
- evaluation/mteb/AmazonReviewsClassification.json +14 -0
- evaluation/mteb/ArguAna.json +37 -0
- evaluation/mteb/ArxivClusteringP2P.json +9 -0
- evaluation/mteb/ArxivClusteringS2S.json +9 -0
- evaluation/mteb/AskUbuntuDupQuestions.json +9 -0
- evaluation/mteb/BIOSSES.json +19 -0
- evaluation/mteb/Banking77Classification.json +12 -0
- evaluation/mteb/BiorxivClusteringP2P.json +9 -0
- evaluation/mteb/BiorxivClusteringS2S.json +9 -0
- evaluation/mteb/CQADupstackAndroidRetrieval.json +37 -0
- evaluation/mteb/CQADupstackEnglishRetrieval.json +37 -0
- evaluation/mteb/CQADupstackGamingRetrieval.json +37 -0
- evaluation/mteb/CQADupstackGisRetrieval.json +37 -0
- evaluation/mteb/CQADupstackMathematicaRetrieval.json +37 -0
- evaluation/mteb/CQADupstackPhysicsRetrieval.json +37 -0
- evaluation/mteb/CQADupstackProgrammersRetrieval.json +37 -0
- evaluation/mteb/CQADupstackRetrieval.json +1 -0
- evaluation/mteb/CQADupstackStatsRetrieval.json +37 -0
- evaluation/mteb/CQADupstackTexRetrieval.json +37 -0
- evaluation/mteb/CQADupstackUnixRetrieval.json +37 -0
- evaluation/mteb/CQADupstackWebmastersRetrieval.json +37 -0
- evaluation/mteb/CQADupstackWordpressRetrieval.json +37 -0
- evaluation/mteb/ClimateFEVER.json +37 -0
- evaluation/mteb/DBPedia.json +37 -0
- evaluation/mteb/EmotionClassification.json +12 -0
- evaluation/mteb/FEVER.json +37 -0
- evaluation/mteb/FiQA2018.json +37 -0
- evaluation/mteb/HotpotQA.json +37 -0
- evaluation/mteb/ImdbClassification.json +14 -0
- evaluation/mteb/MSMARCO.json +37 -0
- evaluation/mteb/MTOPDomainClassification.json +14 -0
- evaluation/mteb/MTOPIntentClassification.json +14 -0
- evaluation/mteb/MassiveIntentClassification.json +14 -0
- evaluation/mteb/MassiveScenarioClassification.json +14 -0
- evaluation/mteb/MedrxivClusteringP2P.json +9 -0
- evaluation/mteb/MedrxivClusteringS2S.json +9 -0
- evaluation/mteb/MindSmallReranking.json +9 -0
- evaluation/mteb/NFCorpus.json +37 -0
- evaluation/mteb/NQ.json +37 -0
- evaluation/mteb/QuoraRetrieval.json +37 -0
- evaluation/mteb/RedditClustering.json +9 -0
- evaluation/mteb/RedditClusteringP2P.json +9 -0
- evaluation/mteb/SCIDOCS.json +37 -0
- evaluation/mteb/SGPT-1.3B-weightedmean-msmarco-specb-bitfit_results.csv +355 -0
- evaluation/mteb/SICK-R.json +19 -0
- evaluation/mteb/STS12.json +19 -0
- evaluation/mteb/STS13.json +19 -0
{eval → evaluation/beir}/beir.json
RENAMED
|
File without changes
|
evaluation/mteb/AmazonCounterfactualClassification.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"en": {
|
| 6 |
+
"accuracy": 0.652089552238806,
|
| 7 |
+
"accuracy_stderr": 0.04707742824740793,
|
| 8 |
+
"ap": 0.2959212705444778,
|
| 9 |
+
"ap_stderr": 0.022393345886320606,
|
| 10 |
+
"f1": 0.5997099864321921,
|
| 11 |
+
"f1_stderr": 0.036697739411917986,
|
| 12 |
+
"main_score": 0.652089552238806
|
| 13 |
+
},
|
| 14 |
+
"evaluation_time": 23.71
|
| 15 |
+
}
|
| 16 |
+
}
|
evaluation/mteb/AmazonPolarityClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"accuracy": 0.7320565,
|
| 6 |
+
"accuracy_stderr": 0.04094219950430119,
|
| 7 |
+
"ap": 0.6736680643550963,
|
| 8 |
+
"ap_stderr": 0.03652809962256317,
|
| 9 |
+
"evaluation_time": 7801.59,
|
| 10 |
+
"f1": 0.7290420520325125,
|
| 11 |
+
"f1_stderr": 0.04396494850187113,
|
| 12 |
+
"main_score": 0.7320565
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/AmazonReviewsClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"en": {
|
| 6 |
+
"accuracy": 0.34956,
|
| 7 |
+
"accuracy_stderr": 0.018705464442242543,
|
| 8 |
+
"f1": 0.3471932443769695,
|
| 9 |
+
"f1_stderr": 0.017698150667922033,
|
| 10 |
+
"main_score": 0.34956
|
| 11 |
+
},
|
| 12 |
+
"evaluation_time": 73.75
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/ArguAna.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 159.23,
|
| 6 |
+
"map_at_1": 0.26102,
|
| 7 |
+
"map_at_10": 0.40958,
|
| 8 |
+
"map_at_100": 0.42033,
|
| 9 |
+
"map_at_1000": 0.42042,
|
| 10 |
+
"map_at_3": 0.36332,
|
| 11 |
+
"map_at_5": 0.38608,
|
| 12 |
+
"mrr_at_1": 0.26387,
|
| 13 |
+
"mrr_at_10": 0.41051,
|
| 14 |
+
"mrr_at_100": 0.42118,
|
| 15 |
+
"mrr_at_1000": 0.42127,
|
| 16 |
+
"mrr_at_3": 0.36415,
|
| 17 |
+
"mrr_at_5": 0.3872,
|
| 18 |
+
"ndcg_at_1": 0.26102,
|
| 19 |
+
"ndcg_at_10": 0.4968,
|
| 20 |
+
"ndcg_at_100": 0.54258,
|
| 21 |
+
"ndcg_at_1000": 0.54486,
|
| 22 |
+
"ndcg_at_3": 0.39864,
|
| 23 |
+
"ndcg_at_5": 0.4398,
|
| 24 |
+
"precision_at_1": 0.26102,
|
| 25 |
+
"precision_at_10": 0.07781,
|
| 26 |
+
"precision_at_100": 0.00979,
|
| 27 |
+
"precision_at_1000": 0.001,
|
| 28 |
+
"precision_at_3": 0.16714,
|
| 29 |
+
"precision_at_5": 0.12034,
|
| 30 |
+
"recall_at_1": 0.26102,
|
| 31 |
+
"recall_at_10": 0.77809,
|
| 32 |
+
"recall_at_100": 0.97866,
|
| 33 |
+
"recall_at_1000": 0.99644,
|
| 34 |
+
"recall_at_3": 0.50142,
|
| 35 |
+
"recall_at_5": 0.60171
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/ArxivClusteringP2P.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 28476.56,
|
| 6 |
+
"v_measure": 0.4338419491695377,
|
| 7 |
+
"v_measure_std": 0.13772932292188322
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/ArxivClusteringS2S.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 3597.82,
|
| 6 |
+
"v_measure": 0.3370962633433912,
|
| 7 |
+
"v_measure_std": 0.14057785790111033
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/AskUbuntuDupQuestions.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 29.27,
|
| 6 |
+
"map": 0.5813305899687008,
|
| 7 |
+
"mrr": 0.7210922041946972
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/BIOSSES.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"cos_sim": {
|
| 6 |
+
"pearson": 0.8662153841660047,
|
| 7 |
+
"spearman": 0.8301514456843275
|
| 8 |
+
},
|
| 9 |
+
"euclidean": {
|
| 10 |
+
"pearson": 0.8600431518427242,
|
| 11 |
+
"spearman": 0.8385552516285784
|
| 12 |
+
},
|
| 13 |
+
"evaluation_time": 4.47,
|
| 14 |
+
"manhattan": {
|
| 15 |
+
"pearson": 0.8583025803351181,
|
| 16 |
+
"spearman": 0.8386636878343106
|
| 17 |
+
}
|
| 18 |
+
}
|
| 19 |
+
}
|
evaluation/mteb/Banking77Classification.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"accuracy": 0.8205844155844156,
|
| 6 |
+
"accuracy_stderr": 0.00898031054024437,
|
| 7 |
+
"evaluation_time": 70.71,
|
| 8 |
+
"f1": 0.8201858378847641,
|
| 9 |
+
"f1_stderr": 0.009423967637409204,
|
| 10 |
+
"main_score": 0.8205844155844156
|
| 11 |
+
}
|
| 12 |
+
}
|
evaluation/mteb/BiorxivClusteringP2P.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 3352.83,
|
| 6 |
+
"v_measure": 0.3505918333141837,
|
| 7 |
+
"v_measure_std": 0.00847894603883707
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/BiorxivClusteringS2S.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 435.49,
|
| 6 |
+
"v_measure": 0.3071055028830579,
|
| 7 |
+
"v_measure_std": 0.008981834294010968
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/CQADupstackAndroidRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 575.19,
|
| 6 |
+
"map_at_1": 0.26519,
|
| 7 |
+
"map_at_10": 0.35634,
|
| 8 |
+
"map_at_100": 0.36961,
|
| 9 |
+
"map_at_1000": 0.37088,
|
| 10 |
+
"map_at_3": 0.32254,
|
| 11 |
+
"map_at_5": 0.3422,
|
| 12 |
+
"mrr_at_1": 0.32332,
|
| 13 |
+
"mrr_at_10": 0.41168,
|
| 14 |
+
"mrr_at_100": 0.41977,
|
| 15 |
+
"mrr_at_1000": 0.42029,
|
| 16 |
+
"mrr_at_3": 0.38197,
|
| 17 |
+
"mrr_at_5": 0.40036,
|
| 18 |
+
"ndcg_at_1": 0.32332,
|
| 19 |
+
"ndcg_at_10": 0.41471,
|
| 20 |
+
"ndcg_at_100": 0.46956,
|
| 21 |
+
"ndcg_at_1000": 0.49262,
|
| 22 |
+
"ndcg_at_3": 0.35938,
|
| 23 |
+
"ndcg_at_5": 0.38703,
|
| 24 |
+
"precision_at_1": 0.32332,
|
| 25 |
+
"precision_at_10": 0.07783,
|
| 26 |
+
"precision_at_100": 0.0129,
|
| 27 |
+
"precision_at_1000": 0.00178,
|
| 28 |
+
"precision_at_3": 0.16834,
|
| 29 |
+
"precision_at_5": 0.12418,
|
| 30 |
+
"recall_at_1": 0.26519,
|
| 31 |
+
"recall_at_10": 0.5319,
|
| 32 |
+
"recall_at_100": 0.76565,
|
| 33 |
+
"recall_at_1000": 0.91478,
|
| 34 |
+
"recall_at_3": 0.38034,
|
| 35 |
+
"recall_at_5": 0.45246
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackEnglishRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 874.22,
|
| 6 |
+
"map_at_1": 0.25356,
|
| 7 |
+
"map_at_10": 0.34596,
|
| 8 |
+
"map_at_100": 0.35714,
|
| 9 |
+
"map_at_1000": 0.3584,
|
| 10 |
+
"map_at_3": 0.32073,
|
| 11 |
+
"map_at_5": 0.33475,
|
| 12 |
+
"mrr_at_1": 0.31274,
|
| 13 |
+
"mrr_at_10": 0.39592,
|
| 14 |
+
"mrr_at_100": 0.40284,
|
| 15 |
+
"mrr_at_1000": 0.4034,
|
| 16 |
+
"mrr_at_3": 0.37378,
|
| 17 |
+
"mrr_at_5": 0.38658,
|
| 18 |
+
"ndcg_at_1": 0.31274,
|
| 19 |
+
"ndcg_at_10": 0.39766,
|
| 20 |
+
"ndcg_at_100": 0.44028,
|
| 21 |
+
"ndcg_at_1000": 0.46445,
|
| 22 |
+
"ndcg_at_3": 0.35934,
|
| 23 |
+
"ndcg_at_5": 0.37751,
|
| 24 |
+
"precision_at_1": 0.31274,
|
| 25 |
+
"precision_at_10": 0.07452,
|
| 26 |
+
"precision_at_100": 0.01217,
|
| 27 |
+
"precision_at_1000": 0.0017,
|
| 28 |
+
"precision_at_3": 0.17431,
|
| 29 |
+
"precision_at_5": 0.12306,
|
| 30 |
+
"recall_at_1": 0.25356,
|
| 31 |
+
"recall_at_10": 0.49344,
|
| 32 |
+
"recall_at_100": 0.67497,
|
| 33 |
+
"recall_at_1000": 0.83372,
|
| 34 |
+
"recall_at_3": 0.38227,
|
| 35 |
+
"recall_at_5": 0.43188
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackGamingRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 931.63,
|
| 6 |
+
"map_at_1": 0.32759,
|
| 7 |
+
"map_at_10": 0.43937,
|
| 8 |
+
"map_at_100": 0.45004,
|
| 9 |
+
"map_at_1000": 0.4507,
|
| 10 |
+
"map_at_3": 0.40805,
|
| 11 |
+
"map_at_5": 0.42497,
|
| 12 |
+
"mrr_at_1": 0.37367,
|
| 13 |
+
"mrr_at_10": 0.47237,
|
| 14 |
+
"mrr_at_100": 0.47973,
|
| 15 |
+
"mrr_at_1000": 0.48011,
|
| 16 |
+
"mrr_at_3": 0.4465,
|
| 17 |
+
"mrr_at_5": 0.46051,
|
| 18 |
+
"ndcg_at_1": 0.37367,
|
| 19 |
+
"ndcg_at_10": 0.49659,
|
| 20 |
+
"ndcg_at_100": 0.54069,
|
| 21 |
+
"ndcg_at_1000": 0.55552,
|
| 22 |
+
"ndcg_at_3": 0.44169,
|
| 23 |
+
"ndcg_at_5": 0.46726,
|
| 24 |
+
"precision_at_1": 0.37367,
|
| 25 |
+
"precision_at_10": 0.08163,
|
| 26 |
+
"precision_at_100": 0.01133,
|
| 27 |
+
"precision_at_1000": 0.00131,
|
| 28 |
+
"precision_at_3": 0.19707,
|
| 29 |
+
"precision_at_5": 0.13718,
|
| 30 |
+
"recall_at_1": 0.32759,
|
| 31 |
+
"recall_at_10": 0.63341,
|
| 32 |
+
"recall_at_100": 0.82502,
|
| 33 |
+
"recall_at_1000": 0.93259,
|
| 34 |
+
"recall_at_3": 0.48796,
|
| 35 |
+
"recall_at_5": 0.54921
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackGisRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1290.88,
|
| 6 |
+
"map_at_1": 0.18962,
|
| 7 |
+
"map_at_10": 0.25863,
|
| 8 |
+
"map_at_100": 0.26818,
|
| 9 |
+
"map_at_1000": 0.26918,
|
| 10 |
+
"map_at_3": 0.23043,
|
| 11 |
+
"map_at_5": 0.24599,
|
| 12 |
+
"mrr_at_1": 0.20452,
|
| 13 |
+
"mrr_at_10": 0.27301,
|
| 14 |
+
"mrr_at_100": 0.28233,
|
| 15 |
+
"mrr_at_1000": 0.2831,
|
| 16 |
+
"mrr_at_3": 0.24539,
|
| 17 |
+
"mrr_at_5": 0.26109,
|
| 18 |
+
"ndcg_at_1": 0.20452,
|
| 19 |
+
"ndcg_at_10": 0.30355,
|
| 20 |
+
"ndcg_at_100": 0.35336,
|
| 21 |
+
"ndcg_at_1000": 0.37927,
|
| 22 |
+
"ndcg_at_3": 0.24705,
|
| 23 |
+
"ndcg_at_5": 0.2742,
|
| 24 |
+
"precision_at_1": 0.20452,
|
| 25 |
+
"precision_at_10": 0.04949,
|
| 26 |
+
"precision_at_100": 0.0078,
|
| 27 |
+
"precision_at_1000": 0.00104,
|
| 28 |
+
"precision_at_3": 0.10358,
|
| 29 |
+
"precision_at_5": 0.07774,
|
| 30 |
+
"recall_at_1": 0.18962,
|
| 31 |
+
"recall_at_10": 0.43056,
|
| 32 |
+
"recall_at_100": 0.66273,
|
| 33 |
+
"recall_at_1000": 0.8596,
|
| 34 |
+
"recall_at_3": 0.27776,
|
| 35 |
+
"recall_at_5": 0.34287
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackMathematicaRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 686.89,
|
| 6 |
+
"map_at_1": 0.1124,
|
| 7 |
+
"map_at_10": 0.18503,
|
| 8 |
+
"map_at_100": 0.19553,
|
| 9 |
+
"map_at_1000": 0.1969,
|
| 10 |
+
"map_at_3": 0.1615,
|
| 11 |
+
"map_at_5": 0.17254,
|
| 12 |
+
"mrr_at_1": 0.13806,
|
| 13 |
+
"mrr_at_10": 0.21939,
|
| 14 |
+
"mrr_at_100": 0.22827,
|
| 15 |
+
"mrr_at_1000": 0.22911,
|
| 16 |
+
"mrr_at_3": 0.1932,
|
| 17 |
+
"mrr_at_5": 0.20558,
|
| 18 |
+
"ndcg_at_1": 0.13806,
|
| 19 |
+
"ndcg_at_10": 0.23383,
|
| 20 |
+
"ndcg_at_100": 0.28834,
|
| 21 |
+
"ndcg_at_1000": 0.32175,
|
| 22 |
+
"ndcg_at_3": 0.18652,
|
| 23 |
+
"ndcg_at_5": 0.20505,
|
| 24 |
+
"precision_at_1": 0.13806,
|
| 25 |
+
"precision_at_10": 0.04714,
|
| 26 |
+
"precision_at_100": 0.00864,
|
| 27 |
+
"precision_at_1000": 0.0013,
|
| 28 |
+
"precision_at_3": 0.09328,
|
| 29 |
+
"precision_at_5": 0.06841,
|
| 30 |
+
"recall_at_1": 0.1124,
|
| 31 |
+
"recall_at_10": 0.34854,
|
| 32 |
+
"recall_at_100": 0.59503,
|
| 33 |
+
"recall_at_1000": 0.8325,
|
| 34 |
+
"recall_at_3": 0.2202,
|
| 35 |
+
"recall_at_5": 0.26715
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackPhysicsRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1269.26,
|
| 6 |
+
"map_at_1": 0.23012,
|
| 7 |
+
"map_at_10": 0.33048,
|
| 8 |
+
"map_at_100": 0.34371,
|
| 9 |
+
"map_at_1000": 0.34489,
|
| 10 |
+
"map_at_3": 0.29943,
|
| 11 |
+
"map_at_5": 0.31602,
|
| 12 |
+
"mrr_at_1": 0.28104,
|
| 13 |
+
"mrr_at_10": 0.3799,
|
| 14 |
+
"mrr_at_100": 0.38836,
|
| 15 |
+
"mrr_at_1000": 0.38891,
|
| 16 |
+
"mrr_at_3": 0.35226,
|
| 17 |
+
"mrr_at_5": 0.36694,
|
| 18 |
+
"ndcg_at_1": 0.28104,
|
| 19 |
+
"ndcg_at_10": 0.39037,
|
| 20 |
+
"ndcg_at_100": 0.44643,
|
| 21 |
+
"ndcg_at_1000": 0.46939,
|
| 22 |
+
"ndcg_at_3": 0.33784,
|
| 23 |
+
"ndcg_at_5": 0.36126,
|
| 24 |
+
"precision_at_1": 0.28104,
|
| 25 |
+
"precision_at_10": 0.07267,
|
| 26 |
+
"precision_at_100": 0.01193,
|
| 27 |
+
"precision_at_1000": 0.00159,
|
| 28 |
+
"precision_at_3": 0.16298,
|
| 29 |
+
"precision_at_5": 0.11684,
|
| 30 |
+
"recall_at_1": 0.23012,
|
| 31 |
+
"recall_at_10": 0.52054,
|
| 32 |
+
"recall_at_100": 0.75622,
|
| 33 |
+
"recall_at_1000": 0.90675,
|
| 34 |
+
"recall_at_3": 0.37282,
|
| 35 |
+
"recall_at_5": 0.43307
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackProgrammersRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1185.95,
|
| 6 |
+
"map_at_1": 0.21624,
|
| 7 |
+
"map_at_10": 0.3021,
|
| 8 |
+
"map_at_100": 0.3152,
|
| 9 |
+
"map_at_1000": 0.31626,
|
| 10 |
+
"map_at_3": 0.26951,
|
| 11 |
+
"map_at_5": 0.28939,
|
| 12 |
+
"mrr_at_1": 0.26941,
|
| 13 |
+
"mrr_at_10": 0.3513,
|
| 14 |
+
"mrr_at_100": 0.3615,
|
| 15 |
+
"mrr_at_1000": 0.36204,
|
| 16 |
+
"mrr_at_3": 0.3242,
|
| 17 |
+
"mrr_at_5": 0.34155,
|
| 18 |
+
"ndcg_at_1": 0.26941,
|
| 19 |
+
"ndcg_at_10": 0.35726,
|
| 20 |
+
"ndcg_at_100": 0.41725,
|
| 21 |
+
"ndcg_at_1000": 0.44105,
|
| 22 |
+
"ndcg_at_3": 0.30184,
|
| 23 |
+
"ndcg_at_5": 0.33176,
|
| 24 |
+
"precision_at_1": 0.26941,
|
| 25 |
+
"precision_at_10": 0.06655,
|
| 26 |
+
"precision_at_100": 0.01152,
|
| 27 |
+
"precision_at_1000": 0.00152,
|
| 28 |
+
"precision_at_3": 0.14346,
|
| 29 |
+
"precision_at_5": 0.10868,
|
| 30 |
+
"recall_at_1": 0.21624,
|
| 31 |
+
"recall_at_10": 0.47359,
|
| 32 |
+
"recall_at_100": 0.73436,
|
| 33 |
+
"recall_at_1000": 0.89988,
|
| 34 |
+
"recall_at_3": 0.3234,
|
| 35 |
+
"recall_at_5": 0.39856
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackRetrieval.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"dataset_version": null, "mteb_version": "0.0.2", "test": {"evaluation_time": 1798.61, "map_at_1": 0.2067566666666667, "map_at_10": 0.28479333333333334, "map_at_100": 0.29612249999999996, "map_at_1000": 0.29731166666666664, "map_at_3": 0.25884, "map_at_5": 0.27298916666666667, "mrr_at_1": 0.24402583333333333, "mrr_at_10": 0.3207041666666667, "mrr_at_100": 0.32958416666666673, "mrr_at_1000": 0.3302541666666666, "mrr_at_3": 0.29677749999999997, "mrr_at_5": 0.3102391666666667, "ndcg_at_1": 0.24402583333333333, "ndcg_at_10": 0.3332616666666667, "ndcg_at_100": 0.38515666666666665, "ndcg_at_1000": 0.4113791666666667, "ndcg_at_3": 0.28687749999999995, "ndcg_at_5": 0.3084766666666667, "precision_at_1": 0.24402583333333333, "precision_at_10": 0.05943749999999999, "precision_at_100": 0.010098333333333334, "precision_at_1000": 0.0014183333333333333, "precision_at_3": 0.132115, "precision_at_5": 0.09548416666666668, "recall_at_1": 0.2067566666666667, "recall_at_10": 0.4424558333333334, "recall_at_100": 0.6731116666666667, "recall_at_1000": 0.8587841666666666, "recall_at_3": 0.3149258333333333, "recall_at_5": 0.3693241666666667}}
|
evaluation/mteb/CQADupstackStatsRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1614.26,
|
| 6 |
+
"map_at_1": 0.1834,
|
| 7 |
+
"map_at_10": 0.23988,
|
| 8 |
+
"map_at_100": 0.24895,
|
| 9 |
+
"map_at_1000": 0.24992,
|
| 10 |
+
"map_at_3": 0.21831,
|
| 11 |
+
"map_at_5": 0.23,
|
| 12 |
+
"mrr_at_1": 0.20399,
|
| 13 |
+
"mrr_at_10": 0.26186,
|
| 14 |
+
"mrr_at_100": 0.27018,
|
| 15 |
+
"mrr_at_1000": 0.27091,
|
| 16 |
+
"mrr_at_3": 0.2408,
|
| 17 |
+
"mrr_at_5": 0.2523,
|
| 18 |
+
"ndcg_at_1": 0.20399,
|
| 19 |
+
"ndcg_at_10": 0.27799,
|
| 20 |
+
"ndcg_at_100": 0.32579,
|
| 21 |
+
"ndcg_at_1000": 0.35209,
|
| 22 |
+
"ndcg_at_3": 0.23684,
|
| 23 |
+
"ndcg_at_5": 0.25521,
|
| 24 |
+
"precision_at_1": 0.20399,
|
| 25 |
+
"precision_at_10": 0.04586,
|
| 26 |
+
"precision_at_100": 0.00755,
|
| 27 |
+
"precision_at_1000": 0.00105,
|
| 28 |
+
"precision_at_3": 0.10276,
|
| 29 |
+
"precision_at_5": 0.07362,
|
| 30 |
+
"recall_at_1": 0.1834,
|
| 31 |
+
"recall_at_10": 0.37456,
|
| 32 |
+
"recall_at_100": 0.5986,
|
| 33 |
+
"recall_at_1000": 0.79703,
|
| 34 |
+
"recall_at_3": 0.26164,
|
| 35 |
+
"recall_at_5": 0.30652
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackTexRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 2711.63,
|
| 6 |
+
"map_at_1": 0.12327,
|
| 7 |
+
"map_at_10": 0.17572,
|
| 8 |
+
"map_at_100": 0.18534,
|
| 9 |
+
"map_at_1000": 0.18653,
|
| 10 |
+
"map_at_3": 0.15703,
|
| 11 |
+
"map_at_5": 0.16752,
|
| 12 |
+
"mrr_at_1": 0.15038,
|
| 13 |
+
"mrr_at_10": 0.20726,
|
| 14 |
+
"mrr_at_100": 0.2161,
|
| 15 |
+
"mrr_at_1000": 0.21695,
|
| 16 |
+
"mrr_at_3": 0.18829,
|
| 17 |
+
"mrr_at_5": 0.19885,
|
| 18 |
+
"ndcg_at_1": 0.15038,
|
| 19 |
+
"ndcg_at_10": 0.21241,
|
| 20 |
+
"ndcg_at_100": 0.26179,
|
| 21 |
+
"ndcg_at_1000": 0.29316,
|
| 22 |
+
"ndcg_at_3": 0.17762,
|
| 23 |
+
"ndcg_at_5": 0.19413,
|
| 24 |
+
"precision_at_1": 0.15038,
|
| 25 |
+
"precision_at_10": 0.03892,
|
| 26 |
+
"precision_at_100": 0.0075,
|
| 27 |
+
"precision_at_1000": 0.00118,
|
| 28 |
+
"precision_at_3": 0.08351,
|
| 29 |
+
"precision_at_5": 0.06187,
|
| 30 |
+
"recall_at_1": 0.12327,
|
| 31 |
+
"recall_at_10": 0.29342,
|
| 32 |
+
"recall_at_100": 0.51854,
|
| 33 |
+
"recall_at_1000": 0.74648,
|
| 34 |
+
"recall_at_3": 0.19596,
|
| 35 |
+
"recall_at_5": 0.23899
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackUnixRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1688.62,
|
| 6 |
+
"map_at_1": 0.20594,
|
| 7 |
+
"map_at_10": 0.27879,
|
| 8 |
+
"map_at_100": 0.28926,
|
| 9 |
+
"map_at_1000": 0.29041,
|
| 10 |
+
"map_at_3": 0.25669,
|
| 11 |
+
"map_at_5": 0.26774,
|
| 12 |
+
"mrr_at_1": 0.23694,
|
| 13 |
+
"mrr_at_10": 0.31335,
|
| 14 |
+
"mrr_at_100": 0.32218,
|
| 15 |
+
"mrr_at_1000": 0.32298,
|
| 16 |
+
"mrr_at_3": 0.2926,
|
| 17 |
+
"mrr_at_5": 0.30328,
|
| 18 |
+
"ndcg_at_1": 0.23694,
|
| 19 |
+
"ndcg_at_10": 0.32456,
|
| 20 |
+
"ndcg_at_100": 0.37667,
|
| 21 |
+
"ndcg_at_1000": 0.40571,
|
| 22 |
+
"ndcg_at_3": 0.28283,
|
| 23 |
+
"ndcg_at_5": 0.29986,
|
| 24 |
+
"precision_at_1": 0.23694,
|
| 25 |
+
"precision_at_10": 0.05448,
|
| 26 |
+
"precision_at_100": 0.00912,
|
| 27 |
+
"precision_at_1000": 0.00127,
|
| 28 |
+
"precision_at_3": 0.12718,
|
| 29 |
+
"precision_at_5": 0.08843,
|
| 30 |
+
"recall_at_1": 0.20594,
|
| 31 |
+
"recall_at_10": 0.43005,
|
| 32 |
+
"recall_at_100": 0.66228,
|
| 33 |
+
"recall_at_1000": 0.87171,
|
| 34 |
+
"recall_at_3": 0.31554,
|
| 35 |
+
"recall_at_5": 0.35838
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackWebmastersRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 540.56,
|
| 6 |
+
"map_at_1": 0.20856,
|
| 7 |
+
"map_at_10": 0.28372,
|
| 8 |
+
"map_at_100": 0.2987,
|
| 9 |
+
"map_at_1000": 0.30075,
|
| 10 |
+
"map_at_3": 0.26054,
|
| 11 |
+
"map_at_5": 0.27129,
|
| 12 |
+
"mrr_at_1": 0.25494,
|
| 13 |
+
"mrr_at_10": 0.32735,
|
| 14 |
+
"mrr_at_100": 0.33794,
|
| 15 |
+
"mrr_at_1000": 0.3385,
|
| 16 |
+
"mrr_at_3": 0.30731,
|
| 17 |
+
"mrr_at_5": 0.31897,
|
| 18 |
+
"ndcg_at_1": 0.25494,
|
| 19 |
+
"ndcg_at_10": 0.33385,
|
| 20 |
+
"ndcg_at_100": 0.39436,
|
| 21 |
+
"ndcg_at_1000": 0.42313,
|
| 22 |
+
"ndcg_at_3": 0.29612,
|
| 23 |
+
"ndcg_at_5": 0.31187,
|
| 24 |
+
"precision_at_1": 0.25494,
|
| 25 |
+
"precision_at_10": 0.06423,
|
| 26 |
+
"precision_at_100": 0.01383,
|
| 27 |
+
"precision_at_1000": 0.00224,
|
| 28 |
+
"precision_at_3": 0.13834,
|
| 29 |
+
"precision_at_5": 0.1,
|
| 30 |
+
"recall_at_1": 0.20856,
|
| 31 |
+
"recall_at_10": 0.42678,
|
| 32 |
+
"recall_at_100": 0.70224,
|
| 33 |
+
"recall_at_1000": 0.89369,
|
| 34 |
+
"recall_at_3": 0.31957,
|
| 35 |
+
"recall_at_5": 0.36026
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/CQADupstackWordpressRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1798.61,
|
| 6 |
+
"map_at_1": 0.16519,
|
| 7 |
+
"map_at_10": 0.2215,
|
| 8 |
+
"map_at_100": 0.23181,
|
| 9 |
+
"map_at_1000": 0.23292,
|
| 10 |
+
"map_at_3": 0.20132,
|
| 11 |
+
"map_at_5": 0.21346,
|
| 12 |
+
"mrr_at_1": 0.1793,
|
| 13 |
+
"mrr_at_10": 0.23506,
|
| 14 |
+
"mrr_at_100": 0.24581,
|
| 15 |
+
"mrr_at_1000": 0.24675,
|
| 16 |
+
"mrr_at_3": 0.21503,
|
| 17 |
+
"mrr_at_5": 0.22686,
|
| 18 |
+
"ndcg_at_1": 0.1793,
|
| 19 |
+
"ndcg_at_10": 0.25636,
|
| 20 |
+
"ndcg_at_100": 0.30736,
|
| 21 |
+
"ndcg_at_1000": 0.33841,
|
| 22 |
+
"ndcg_at_3": 0.21546,
|
| 23 |
+
"ndcg_at_5": 0.23658,
|
| 24 |
+
"precision_at_1": 0.1793,
|
| 25 |
+
"precision_at_10": 0.03993,
|
| 26 |
+
"precision_at_100": 0.00689,
|
| 27 |
+
"precision_at_1000": 0.00104,
|
| 28 |
+
"precision_at_3": 0.09057,
|
| 29 |
+
"precision_at_5": 0.0658,
|
| 30 |
+
"recall_at_1": 0.16519,
|
| 31 |
+
"recall_at_10": 0.35268,
|
| 32 |
+
"recall_at_100": 0.5817,
|
| 33 |
+
"recall_at_1000": 0.81668,
|
| 34 |
+
"recall_at_3": 0.24165,
|
| 35 |
+
"recall_at_5": 0.29254
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/ClimateFEVER.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 16391.42,
|
| 6 |
+
"map_at_1": 0.10363,
|
| 7 |
+
"map_at_10": 0.18301,
|
| 8 |
+
"map_at_100": 0.20019,
|
| 9 |
+
"map_at_1000": 0.20207,
|
| 10 |
+
"map_at_3": 0.14877,
|
| 11 |
+
"map_at_5": 0.16544,
|
| 12 |
+
"mrr_at_1": 0.22866,
|
| 13 |
+
"mrr_at_10": 0.34935,
|
| 14 |
+
"mrr_at_100": 0.35802,
|
| 15 |
+
"mrr_at_1000": 0.3584,
|
| 16 |
+
"mrr_at_3": 0.30966,
|
| 17 |
+
"mrr_at_5": 0.33204,
|
| 18 |
+
"ndcg_at_1": 0.22866,
|
| 19 |
+
"ndcg_at_10": 0.26595,
|
| 20 |
+
"ndcg_at_100": 0.33514,
|
| 21 |
+
"ndcg_at_1000": 0.36872,
|
| 22 |
+
"ndcg_at_3": 0.20667,
|
| 23 |
+
"ndcg_at_5": 0.22728,
|
| 24 |
+
"precision_at_1": 0.22866,
|
| 25 |
+
"precision_at_10": 0.08632,
|
| 26 |
+
"precision_at_100": 0.01612,
|
| 27 |
+
"precision_at_1000": 0.00224,
|
| 28 |
+
"precision_at_3": 0.15505,
|
| 29 |
+
"precision_at_5": 0.12404,
|
| 30 |
+
"recall_at_1": 0.10363,
|
| 31 |
+
"recall_at_10": 0.33494,
|
| 32 |
+
"recall_at_100": 0.57593,
|
| 33 |
+
"recall_at_1000": 0.76342,
|
| 34 |
+
"recall_at_3": 0.19157,
|
| 35 |
+
"recall_at_5": 0.24638
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/DBPedia.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 11184.99,
|
| 6 |
+
"map_at_1": 0.07436,
|
| 7 |
+
"map_at_10": 0.1476,
|
| 8 |
+
"map_at_100": 0.19206,
|
| 9 |
+
"map_at_1000": 0.20267,
|
| 10 |
+
"map_at_3": 0.10894,
|
| 11 |
+
"map_at_5": 0.12829,
|
| 12 |
+
"mrr_at_1": 0.5425,
|
| 13 |
+
"mrr_at_10": 0.63769,
|
| 14 |
+
"mrr_at_100": 0.64193,
|
| 15 |
+
"mrr_at_1000": 0.64211,
|
| 16 |
+
"mrr_at_3": 0.61458,
|
| 17 |
+
"mrr_at_5": 0.63096,
|
| 18 |
+
"ndcg_at_1": 0.42875,
|
| 19 |
+
"ndcg_at_10": 0.31507,
|
| 20 |
+
"ndcg_at_100": 0.34559,
|
| 21 |
+
"ndcg_at_1000": 0.41246,
|
| 22 |
+
"ndcg_at_3": 0.35058,
|
| 23 |
+
"ndcg_at_5": 0.33396,
|
| 24 |
+
"precision_at_1": 0.5425,
|
| 25 |
+
"precision_at_10": 0.2445,
|
| 26 |
+
"precision_at_100": 0.07383,
|
| 27 |
+
"precision_at_1000": 0.01582,
|
| 28 |
+
"precision_at_3": 0.38083,
|
| 29 |
+
"precision_at_5": 0.326,
|
| 30 |
+
"recall_at_1": 0.07436,
|
| 31 |
+
"recall_at_10": 0.19862,
|
| 32 |
+
"recall_at_100": 0.38981,
|
| 33 |
+
"recall_at_1000": 0.61038,
|
| 34 |
+
"recall_at_3": 0.11949,
|
| 35 |
+
"recall_at_5": 0.15562
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/EmotionClassification.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"accuracy": 0.46390000000000003,
|
| 6 |
+
"accuracy_stderr": 0.018785366645343925,
|
| 7 |
+
"evaluation_time": 31.09,
|
| 8 |
+
"f1": 0.42264248858567033,
|
| 9 |
+
"f1_stderr": 0.011565342464001555,
|
| 10 |
+
"main_score": 0.46390000000000003
|
| 11 |
+
}
|
| 12 |
+
}
|
evaluation/mteb/FEVER.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 17506.78,
|
| 6 |
+
"map_at_1": 0.50916,
|
| 7 |
+
"map_at_10": 0.62258,
|
| 8 |
+
"map_at_100": 0.62741,
|
| 9 |
+
"map_at_1000": 0.62763,
|
| 10 |
+
"map_at_3": 0.60018,
|
| 11 |
+
"map_at_5": 0.6142,
|
| 12 |
+
"mrr_at_1": 0.54965,
|
| 13 |
+
"mrr_at_10": 0.66554,
|
| 14 |
+
"mrr_at_100": 0.66966,
|
| 15 |
+
"mrr_at_1000": 0.66978,
|
| 16 |
+
"mrr_at_3": 0.64414,
|
| 17 |
+
"mrr_at_5": 0.6577,
|
| 18 |
+
"ndcg_at_1": 0.54965,
|
| 19 |
+
"ndcg_at_10": 0.6812,
|
| 20 |
+
"ndcg_at_100": 0.70282,
|
| 21 |
+
"ndcg_at_1000": 0.70788,
|
| 22 |
+
"ndcg_at_3": 0.63862,
|
| 23 |
+
"ndcg_at_5": 0.66216,
|
| 24 |
+
"precision_at_1": 0.54965,
|
| 25 |
+
"precision_at_10": 0.08998,
|
| 26 |
+
"precision_at_100": 0.01016,
|
| 27 |
+
"precision_at_1000": 0.00107,
|
| 28 |
+
"precision_at_3": 0.25618,
|
| 29 |
+
"precision_at_5": 0.16676,
|
| 30 |
+
"recall_at_1": 0.50916,
|
| 31 |
+
"recall_at_10": 0.8204,
|
| 32 |
+
"recall_at_100": 0.91689,
|
| 33 |
+
"recall_at_1000": 0.95349,
|
| 34 |
+
"recall_at_3": 0.70512,
|
| 35 |
+
"recall_at_5": 0.76299
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/FiQA2018.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 310.86,
|
| 6 |
+
"map_at_1": 0.13568,
|
| 7 |
+
"map_at_10": 0.23264,
|
| 8 |
+
"map_at_100": 0.24824,
|
| 9 |
+
"map_at_1000": 0.25014,
|
| 10 |
+
"map_at_3": 0.19724,
|
| 11 |
+
"map_at_5": 0.21772,
|
| 12 |
+
"mrr_at_1": 0.27315,
|
| 13 |
+
"mrr_at_10": 0.35935,
|
| 14 |
+
"mrr_at_100": 0.36929,
|
| 15 |
+
"mrr_at_1000": 0.36985,
|
| 16 |
+
"mrr_at_3": 0.33591,
|
| 17 |
+
"mrr_at_5": 0.34848,
|
| 18 |
+
"ndcg_at_1": 0.27315,
|
| 19 |
+
"ndcg_at_10": 0.29988,
|
| 20 |
+
"ndcg_at_100": 0.3641,
|
| 21 |
+
"ndcg_at_1000": 0.40185,
|
| 22 |
+
"ndcg_at_3": 0.26342,
|
| 23 |
+
"ndcg_at_5": 0.2768,
|
| 24 |
+
"precision_at_1": 0.27315,
|
| 25 |
+
"precision_at_10": 0.08565,
|
| 26 |
+
"precision_at_100": 0.01508,
|
| 27 |
+
"precision_at_1000": 0.00219,
|
| 28 |
+
"precision_at_3": 0.1785,
|
| 29 |
+
"precision_at_5": 0.13673,
|
| 30 |
+
"recall_at_1": 0.13568,
|
| 31 |
+
"recall_at_10": 0.37133,
|
| 32 |
+
"recall_at_100": 0.61475,
|
| 33 |
+
"recall_at_1000": 0.84372,
|
| 34 |
+
"recall_at_3": 0.24112,
|
| 35 |
+
"recall_at_5": 0.29507
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/HotpotQA.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 13678.13,
|
| 6 |
+
"map_at_1": 0.30878,
|
| 7 |
+
"map_at_10": 0.40868,
|
| 8 |
+
"map_at_100": 0.41694,
|
| 9 |
+
"map_at_1000": 0.41775,
|
| 10 |
+
"map_at_3": 0.3856,
|
| 11 |
+
"map_at_5": 0.39947,
|
| 12 |
+
"mrr_at_1": 0.61756,
|
| 13 |
+
"mrr_at_10": 0.68265,
|
| 14 |
+
"mrr_at_100": 0.68671,
|
| 15 |
+
"mrr_at_1000": 0.68694,
|
| 16 |
+
"mrr_at_3": 0.66784,
|
| 17 |
+
"mrr_at_5": 0.67704,
|
| 18 |
+
"ndcg_at_1": 0.61756,
|
| 19 |
+
"ndcg_at_10": 0.49931,
|
| 20 |
+
"ndcg_at_100": 0.53179,
|
| 21 |
+
"ndcg_at_1000": 0.54948,
|
| 22 |
+
"ndcg_at_3": 0.46103,
|
| 23 |
+
"ndcg_at_5": 0.48147,
|
| 24 |
+
"precision_at_1": 0.61756,
|
| 25 |
+
"precision_at_10": 0.10163,
|
| 26 |
+
"precision_at_100": 0.01271,
|
| 27 |
+
"precision_at_1000": 0.00151,
|
| 28 |
+
"precision_at_3": 0.28179,
|
| 29 |
+
"precision_at_5": 0.18528,
|
| 30 |
+
"recall_at_1": 0.30878,
|
| 31 |
+
"recall_at_10": 0.50817,
|
| 32 |
+
"recall_at_100": 0.63545,
|
| 33 |
+
"recall_at_1000": 0.75361,
|
| 34 |
+
"recall_at_3": 0.42269,
|
| 35 |
+
"recall_at_5": 0.4632
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/ImdbClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"accuracy": 0.6404799999999999,
|
| 6 |
+
"accuracy_stderr": 0.03197141223030349,
|
| 7 |
+
"ap": 0.5918525145533928,
|
| 8 |
+
"ap_stderr": 0.024531019346391677,
|
| 9 |
+
"evaluation_time": 915.58,
|
| 10 |
+
"f1": 0.6394712318134925,
|
| 11 |
+
"f1_stderr": 0.0317267000377415,
|
| 12 |
+
"main_score": 0.6404799999999999
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/MSMARCO.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"validation": {
|
| 5 |
+
"evaluation_time": 22861.03,
|
| 6 |
+
"map_at_1": 0.189,
|
| 7 |
+
"map_at_10": 0.29748,
|
| 8 |
+
"map_at_100": 0.30976,
|
| 9 |
+
"map_at_1000": 0.31041,
|
| 10 |
+
"map_at_3": 0.26113,
|
| 11 |
+
"map_at_5": 0.28197,
|
| 12 |
+
"mrr_at_1": 0.19413,
|
| 13 |
+
"mrr_at_10": 0.30322,
|
| 14 |
+
"mrr_at_100": 0.31497,
|
| 15 |
+
"mrr_at_1000": 0.31555,
|
| 16 |
+
"mrr_at_3": 0.26729,
|
| 17 |
+
"mrr_at_5": 0.28789,
|
| 18 |
+
"ndcg_at_1": 0.19413,
|
| 19 |
+
"ndcg_at_10": 0.36048,
|
| 20 |
+
"ndcg_at_100": 0.42152,
|
| 21 |
+
"ndcg_at_1000": 0.43772,
|
| 22 |
+
"ndcg_at_3": 0.28642,
|
| 23 |
+
"ndcg_at_5": 0.32358,
|
| 24 |
+
"precision_at_1": 0.19413,
|
| 25 |
+
"precision_at_10": 0.05785,
|
| 26 |
+
"precision_at_100": 0.00887,
|
| 27 |
+
"precision_at_1000": 0.00103,
|
| 28 |
+
"precision_at_3": 0.12192,
|
| 29 |
+
"precision_at_5": 0.09189,
|
| 30 |
+
"recall_at_1": 0.189,
|
| 31 |
+
"recall_at_10": 0.55457,
|
| 32 |
+
"recall_at_100": 0.84091,
|
| 33 |
+
"recall_at_1000": 0.96482,
|
| 34 |
+
"recall_at_3": 0.35359,
|
| 35 |
+
"recall_at_5": 0.44275
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/MTOPDomainClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"en": {
|
| 6 |
+
"accuracy": 0.9207706338349293,
|
| 7 |
+
"accuracy_stderr": 0.005541106237593856,
|
| 8 |
+
"f1": 0.9156680443236652,
|
| 9 |
+
"f1_stderr": 0.005216941657420623,
|
| 10 |
+
"main_score": 0.9207706338349293
|
| 11 |
+
},
|
| 12 |
+
"evaluation_time": 31.37
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/MTOPIntentClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"en": {
|
| 6 |
+
"accuracy": 0.7118559051527589,
|
| 7 |
+
"accuracy_stderr": 0.012419016906278644,
|
| 8 |
+
"f1": 0.5242887061726789,
|
| 9 |
+
"f1_stderr": 0.011199354119349208,
|
| 10 |
+
"main_score": 0.7118559051527589
|
| 11 |
+
},
|
| 12 |
+
"evaluation_time": 82.02
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/MassiveIntentClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"en": {
|
| 6 |
+
"accuracy": 0.6864828513786148,
|
| 7 |
+
"accuracy_stderr": 0.012244395475104431,
|
| 8 |
+
"f1": 0.6654281381596097,
|
| 9 |
+
"f1_stderr": 0.009337695311493243,
|
| 10 |
+
"main_score": 0.6864828513786148
|
| 11 |
+
},
|
| 12 |
+
"evaluation_time": 49.93
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/MassiveScenarioClassification.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"en": {
|
| 6 |
+
"accuracy": 0.7604236718224613,
|
| 7 |
+
"accuracy_stderr": 0.009702648067132833,
|
| 8 |
+
"f1": 0.7589170458655639,
|
| 9 |
+
"f1_stderr": 0.009666037600064457,
|
| 10 |
+
"main_score": 0.7604236718224613
|
| 11 |
+
},
|
| 12 |
+
"evaluation_time": 29.65
|
| 13 |
+
}
|
| 14 |
+
}
|
evaluation/mteb/MedrxivClusteringP2P.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 1694.42,
|
| 6 |
+
"v_measure": 0.320840369055247,
|
| 7 |
+
"v_measure_std": 0.012975340075124157
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/MedrxivClusteringS2S.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 258.59,
|
| 6 |
+
"v_measure": 0.29448729560244535,
|
| 7 |
+
"v_measure_std": 0.014610308837145732
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/MindSmallReranking.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 18115.54,
|
| 6 |
+
"map": 0.31340856463122374,
|
| 7 |
+
"mrr": 0.32398547669840916
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/NFCorpus.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 101.25,
|
| 6 |
+
"map_at_1": 0.05526,
|
| 7 |
+
"map_at_10": 0.11745,
|
| 8 |
+
"map_at_100": 0.14831,
|
| 9 |
+
"map_at_1000": 0.16235,
|
| 10 |
+
"map_at_3": 0.08716,
|
| 11 |
+
"map_at_5": 0.10101,
|
| 12 |
+
"mrr_at_1": 0.43653,
|
| 13 |
+
"mrr_at_10": 0.51067,
|
| 14 |
+
"mrr_at_100": 0.51881,
|
| 15 |
+
"mrr_at_1000": 0.51912,
|
| 16 |
+
"mrr_at_3": 0.4902,
|
| 17 |
+
"mrr_at_5": 0.50289,
|
| 18 |
+
"ndcg_at_1": 0.4195,
|
| 19 |
+
"ndcg_at_10": 0.32083,
|
| 20 |
+
"ndcg_at_100": 0.3005,
|
| 21 |
+
"ndcg_at_1000": 0.38661,
|
| 22 |
+
"ndcg_at_3": 0.3794,
|
| 23 |
+
"ndcg_at_5": 0.35456,
|
| 24 |
+
"precision_at_1": 0.43344,
|
| 25 |
+
"precision_at_10": 0.23437,
|
| 26 |
+
"precision_at_100": 0.0783,
|
| 27 |
+
"precision_at_1000": 0.02053,
|
| 28 |
+
"precision_at_3": 0.35501,
|
| 29 |
+
"precision_at_5": 0.30464,
|
| 30 |
+
"recall_at_1": 0.05526,
|
| 31 |
+
"recall_at_10": 0.15446,
|
| 32 |
+
"recall_at_100": 0.31179,
|
| 33 |
+
"recall_at_1000": 0.61578,
|
| 34 |
+
"recall_at_3": 0.0971,
|
| 35 |
+
"recall_at_5": 0.12026
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/NQ.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 8091.11,
|
| 6 |
+
"map_at_1": 0.23467,
|
| 7 |
+
"map_at_10": 0.36041,
|
| 8 |
+
"map_at_100": 0.37268,
|
| 9 |
+
"map_at_1000": 0.37322,
|
| 10 |
+
"map_at_3": 0.3209,
|
| 11 |
+
"map_at_5": 0.34414,
|
| 12 |
+
"mrr_at_1": 0.26738,
|
| 13 |
+
"mrr_at_10": 0.38665,
|
| 14 |
+
"mrr_at_100": 0.3964,
|
| 15 |
+
"mrr_at_1000": 0.39681,
|
| 16 |
+
"mrr_at_3": 0.35207,
|
| 17 |
+
"mrr_at_5": 0.3731,
|
| 18 |
+
"ndcg_at_1": 0.26709,
|
| 19 |
+
"ndcg_at_10": 0.42942,
|
| 20 |
+
"ndcg_at_100": 0.48296,
|
| 21 |
+
"ndcg_at_1000": 0.49651,
|
| 22 |
+
"ndcg_at_3": 0.35413,
|
| 23 |
+
"ndcg_at_5": 0.39368,
|
| 24 |
+
"precision_at_1": 0.26709,
|
| 25 |
+
"precision_at_10": 0.07306,
|
| 26 |
+
"precision_at_100": 0.01029,
|
| 27 |
+
"precision_at_1000": 0.00116,
|
| 28 |
+
"precision_at_3": 0.16348,
|
| 29 |
+
"precision_at_5": 0.12068,
|
| 30 |
+
"recall_at_1": 0.23467,
|
| 31 |
+
"recall_at_10": 0.61493,
|
| 32 |
+
"recall_at_100": 0.85011,
|
| 33 |
+
"recall_at_1000": 0.95261,
|
| 34 |
+
"recall_at_3": 0.41952,
|
| 35 |
+
"recall_at_5": 0.51106
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/QuoraRetrieval.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 742.32,
|
| 6 |
+
"map_at_1": 0.67517,
|
| 7 |
+
"map_at_10": 0.81054,
|
| 8 |
+
"map_at_100": 0.81727,
|
| 9 |
+
"map_at_1000": 0.81752,
|
| 10 |
+
"map_at_3": 0.78018,
|
| 11 |
+
"map_at_5": 0.79879,
|
| 12 |
+
"mrr_at_1": 0.7752,
|
| 13 |
+
"mrr_at_10": 0.84429,
|
| 14 |
+
"mrr_at_100": 0.84582,
|
| 15 |
+
"mrr_at_1000": 0.84584,
|
| 16 |
+
"mrr_at_3": 0.83268,
|
| 17 |
+
"mrr_at_5": 0.84013,
|
| 18 |
+
"ndcg_at_1": 0.7753,
|
| 19 |
+
"ndcg_at_10": 0.85277,
|
| 20 |
+
"ndcg_at_100": 0.86805,
|
| 21 |
+
"ndcg_at_1000": 0.8701,
|
| 22 |
+
"ndcg_at_3": 0.81975,
|
| 23 |
+
"ndcg_at_5": 0.83723,
|
| 24 |
+
"precision_at_1": 0.7753,
|
| 25 |
+
"precision_at_10": 0.12961,
|
| 26 |
+
"precision_at_100": 0.01502,
|
| 27 |
+
"precision_at_1000": 0.00156,
|
| 28 |
+
"precision_at_3": 0.35713,
|
| 29 |
+
"precision_at_5": 0.23574,
|
| 30 |
+
"recall_at_1": 0.67517,
|
| 31 |
+
"recall_at_10": 0.93486,
|
| 32 |
+
"recall_at_100": 0.989,
|
| 33 |
+
"recall_at_1000": 0.9993,
|
| 34 |
+
"recall_at_3": 0.8418,
|
| 35 |
+
"recall_at_5": 0.88975
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/RedditClustering.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 3324.44,
|
| 6 |
+
"v_measure": 0.48225994608749917,
|
| 7 |
+
"v_measure_std": 0.055941572162319216
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/RedditClusteringP2P.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 13390.64,
|
| 6 |
+
"v_measure": 0.5317635557157765,
|
| 7 |
+
"v_measure_std": 0.12570620726605897
|
| 8 |
+
}
|
| 9 |
+
}
|
evaluation/mteb/SCIDOCS.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"evaluation_time": 214.39,
|
| 6 |
+
"map_at_1": 0.03988,
|
| 7 |
+
"map_at_10": 0.094,
|
| 8 |
+
"map_at_100": 0.10968,
|
| 9 |
+
"map_at_1000": 0.11257,
|
| 10 |
+
"map_at_3": 0.07123,
|
| 11 |
+
"map_at_5": 0.08221,
|
| 12 |
+
"mrr_at_1": 0.197,
|
| 13 |
+
"mrr_at_10": 0.29098,
|
| 14 |
+
"mrr_at_100": 0.30247,
|
| 15 |
+
"mrr_at_1000": 0.30318,
|
| 16 |
+
"mrr_at_3": 0.2655,
|
| 17 |
+
"mrr_at_5": 0.27915,
|
| 18 |
+
"ndcg_at_1": 0.197,
|
| 19 |
+
"ndcg_at_10": 0.16176,
|
| 20 |
+
"ndcg_at_100": 0.22931,
|
| 21 |
+
"ndcg_at_1000": 0.28301,
|
| 22 |
+
"ndcg_at_3": 0.16142,
|
| 23 |
+
"ndcg_at_5": 0.13634,
|
| 24 |
+
"precision_at_1": 0.197,
|
| 25 |
+
"precision_at_10": 0.0818,
|
| 26 |
+
"precision_at_100": 0.01801,
|
| 27 |
+
"precision_at_1000": 0.00309,
|
| 28 |
+
"precision_at_3": 0.151,
|
| 29 |
+
"precision_at_5": 0.1174,
|
| 30 |
+
"recall_at_1": 0.03988,
|
| 31 |
+
"recall_at_10": 0.16625,
|
| 32 |
+
"recall_at_100": 0.3661,
|
| 33 |
+
"recall_at_1000": 0.62805,
|
| 34 |
+
"recall_at_3": 0.09168,
|
| 35 |
+
"recall_at_5": 0.11902
|
| 36 |
+
}
|
| 37 |
+
}
|
evaluation/mteb/SGPT-1.3B-weightedmean-msmarco-specb-bitfit_results.csv
ADDED
|
@@ -0,0 +1,355 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model,task,dataset,language,metric,value
|
| 2 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,BitextMining,BUCC,,f1,
|
| 3 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,BitextMining,Tatoeba,,f1,
|
| 4 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en,accuracy,0.652089552238806
|
| 5 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
|
| 6 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
|
| 7 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
|
| 8 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
|
| 9 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
|
| 10 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
|
| 11 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonPolarityClassification,en,accuracy,0.7320565
|
| 12 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,en,accuracy,0.34956
|
| 13 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
|
| 14 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
|
| 15 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
|
| 16 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
|
| 17 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
|
| 18 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
|
| 19 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
|
| 20 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
|
| 21 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
|
| 22 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
|
| 23 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,Banking77Classification,en,accuracy,0.8205844155844156
|
| 24 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,EmotionClassification,en,accuracy,0.46390000000000003
|
| 25 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,ImdbClassification,en,accuracy,0.6404799999999999
|
| 26 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
|
| 27 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
|
| 28 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
|
| 29 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
|
| 30 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
|
| 31 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
|
| 32 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
|
| 33 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
|
| 34 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
|
| 35 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
|
| 36 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
|
| 37 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
|
| 38 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
|
| 39 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
|
| 40 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
|
| 41 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
|
| 42 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
|
| 43 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
|
| 44 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,en,accuracy,0.6864828513786148
|
| 45 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
|
| 46 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
|
| 47 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
|
| 48 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
|
| 49 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
|
| 50 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
|
| 51 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
|
| 52 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
|
| 53 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
|
| 54 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
|
| 55 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
|
| 56 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
|
| 57 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
|
| 58 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
|
| 59 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
|
| 60 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
|
| 61 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
|
| 62 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
|
| 63 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
|
| 64 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
|
| 65 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
|
| 66 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
|
| 67 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
|
| 68 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
|
| 69 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
|
| 70 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
|
| 71 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
|
| 72 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
|
| 73 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
|
| 74 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
|
| 75 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
|
| 76 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
|
| 77 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
|
| 78 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
|
| 79 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
|
| 80 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
|
| 81 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
|
| 82 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
|
| 83 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
|
| 84 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
|
| 85 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
|
| 86 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
|
| 87 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
|
| 88 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
|
| 89 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
|
| 90 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
|
| 91 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
|
| 92 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
|
| 93 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
|
| 94 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
|
| 95 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
|
| 96 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
|
| 97 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
|
| 98 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
|
| 99 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
|
| 100 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
|
| 101 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
|
| 102 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
|
| 103 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
|
| 104 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
|
| 105 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
|
| 106 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
|
| 107 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
|
| 108 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
|
| 109 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
|
| 110 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
|
| 111 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
|
| 112 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
|
| 113 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
|
| 114 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
|
| 115 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
|
| 116 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
|
| 117 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
|
| 118 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
|
| 119 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
|
| 120 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
|
| 121 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
|
| 122 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
|
| 123 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
|
| 124 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
|
| 125 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
|
| 126 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
|
| 127 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
|
| 128 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
|
| 129 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
|
| 130 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
|
| 131 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
|
| 132 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
|
| 133 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
|
| 134 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
|
| 135 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
|
| 136 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
|
| 137 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
|
| 138 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
|
| 139 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
|
| 140 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
|
| 141 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
|
| 142 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
|
| 143 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
|
| 144 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
|
| 145 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,en,accuracy,0.7604236718224613
|
| 146 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
|
| 147 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
|
| 148 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
|
| 149 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
|
| 150 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
|
| 151 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
|
| 152 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
|
| 153 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
|
| 154 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
|
| 155 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
|
| 156 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
|
| 157 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
|
| 158 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
|
| 159 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
|
| 160 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
|
| 161 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
|
| 162 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
|
| 163 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
|
| 164 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
|
| 165 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
|
| 166 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
|
| 167 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
|
| 168 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
|
| 169 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
|
| 170 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
|
| 171 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
|
| 172 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
|
| 173 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
|
| 174 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
|
| 175 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
|
| 176 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
|
| 177 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
|
| 178 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
|
| 179 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
|
| 180 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
|
| 181 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
|
| 182 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
|
| 183 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
|
| 184 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
|
| 185 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
|
| 186 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
|
| 187 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
|
| 188 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
|
| 189 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
|
| 190 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
|
| 191 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
|
| 192 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
|
| 193 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
|
| 194 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
|
| 195 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
|
| 196 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
|
| 197 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
|
| 198 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
|
| 199 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
|
| 200 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
|
| 201 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
|
| 202 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
|
| 203 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
|
| 204 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
|
| 205 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
|
| 206 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
|
| 207 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
|
| 208 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
|
| 209 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
|
| 210 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
|
| 211 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
|
| 212 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
|
| 213 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
|
| 214 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
|
| 215 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
|
| 216 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
|
| 217 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
|
| 218 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
|
| 219 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
|
| 220 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
|
| 221 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
|
| 222 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
|
| 223 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
|
| 224 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
|
| 225 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
|
| 226 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
|
| 227 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
|
| 228 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,en,accuracy,0.9207706338349293
|
| 229 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
|
| 230 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
|
| 231 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
|
| 232 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
|
| 233 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
|
| 234 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
|
| 235 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
|
| 236 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
|
| 237 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
|
| 238 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
|
| 239 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,en,accuracy,0.7118559051527589
|
| 240 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
|
| 241 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
|
| 242 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
|
| 243 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
|
| 244 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
|
| 245 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
|
| 246 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
|
| 247 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
|
| 248 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
|
| 249 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
|
| 250 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,ToxicConversationsClassification,en,accuracy,0.687272
|
| 251 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,TweetSentimentExtractionClassification,en,accuracy,0.556677985285795
|
| 252 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringP2P,en,v_measure,0.4338419491695377
|
| 253 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringS2S,en,v_measure,0.3370962633433912
|
| 254 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringP2P,en,v_measure,0.3505918333141837
|
| 255 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringS2S,en,v_measure,0.3071055028830579
|
| 256 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringP2P,en,v_measure,0.320840369055247
|
| 257 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringS2S,en,v_measure,0.29448729560244535
|
| 258 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClustering,en,v_measure,0.48225994608749917
|
| 259 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClusteringP2P,en,v_measure,0.5317635557157765
|
| 260 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClustering,en,v_measure,0.6085593925770172
|
| 261 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClusteringP2P,en,v_measure,0.323567729982375
|
| 262 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,TwentyNewsgroupsClustering,en,v_measure,0.4005809562275603
|
| 263 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,SprintDuplicateQuestions,en,ap,0.9257836032673468
|
| 264 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterSemEval2015,en,ap,0.6237052608803734
|
| 265 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterURLCorpus,en,ap,0.8378748636891035
|
| 266 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,AskUbuntuDupQuestions,en,map,0.5813305899687008
|
| 267 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,MindSmallReranking,en,map,0.31340856463122374
|
| 268 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,SciDocsRR,en,map,0.7721233007730808
|
| 269 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,StackOverflowDupQuestions,en,map,0.49320607035290737
|
| 270 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,ArguAna,en,ndcg_at_10,0.4968
|
| 271 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,ClimateFEVER,en,ndcg_at_10,0.26595
|
| 272 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,CQADupstackRetrieval,en,ndcg_at_10,0.3332616666666667
|
| 273 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,DBPedia,en,ndcg_at_10,0.31507
|
| 274 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,FEVER,en,ndcg_at_10,0.6812
|
| 275 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,FiQA2018,en,ndcg_at_10,0.29988
|
| 276 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,HotpotQA,en,ndcg_at_10,0.49931
|
| 277 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,MSMARCO,en,ndcg_at_10,0.36048
|
| 278 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,NFCorpus,en,ndcg_at_10,0.32083
|
| 279 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,NQ,en,ndcg_at_10,0.42942
|
| 280 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,QuoraRetrieval,en,ndcg_at_10,0.85277
|
| 281 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,SCIDOCS,en,ndcg_at_10,0.16176
|
| 282 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,SciFact,en,ndcg_at_10,0.68287
|
| 283 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,Touche2020,en,ndcg_at_10,0.2445
|
| 284 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,TRECCOVID,en,ndcg_at_10,0.7298
|
| 285 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,BIOSSES,en,cosine_spearman,0.8301514456843275
|
| 286 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,SICK-R,en,cosine_spearman,0.6722953551111448
|
| 287 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS12,en,cosine_spearman,0.6659241013465915
|
| 288 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS13,en,cosine_spearman,0.7733151317062642
|
| 289 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS14,en,cosine_spearman,0.7182815265534886
|
| 290 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS15,en,cosine_spearman,0.8065931167868883
|
| 291 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS16,en,cosine_spearman,0.7891151365939403
|
| 292 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
|
| 293 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
|
| 294 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
|
| 295 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
|
| 296 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
|
| 297 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
|
| 298 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
|
| 299 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
|
| 300 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-en,cosine_spearman,0.8698674844768606
|
| 301 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
|
| 302 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
|
| 303 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
|
| 304 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
|
| 305 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
|
| 306 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
|
| 307 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
|
| 308 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
|
| 309 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
|
| 310 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
|
| 311 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
|
| 312 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
|
| 313 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,en,cosine_spearman,0.6730387805090023
|
| 314 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
|
| 315 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
|
| 316 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
|
| 317 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
|
| 318 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
|
| 319 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
|
| 320 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
|
| 321 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
|
| 322 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
|
| 323 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
|
| 324 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
|
| 325 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
|
| 326 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
|
| 327 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
|
| 328 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
|
| 329 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
|
| 330 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
|
| 331 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
|
| 332 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
|
| 333 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
|
| 334 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
|
| 335 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
|
| 336 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
|
| 337 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
|
| 338 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
|
| 339 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
|
| 340 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
|
| 341 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
|
| 342 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
|
| 343 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
|
| 344 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
|
| 345 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
|
| 346 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
|
| 347 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
|
| 348 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,STSBenchmark,en,cosine_spearman,0.775887175717799
|
| 349 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Summarization,SummEval,en,cosine_spearman,0.25440272876996695
|
| 350 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Classification,average,en,accuracy,0.6651794596081484
|
| 351 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Clustering,average,en,v_measure,0.3991540721780082
|
| 352 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,PairClassification,average,en,ap,0.7957879092789413
|
| 353 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Reranking,average,en,map,0.5400171314314782
|
| 354 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,Retrieval,average,en,ndcg_at_10,0.4449267777777778
|
| 355 |
+
SGPT-1.3B-weightedmean-msmarco-specb-bitfit,STS,average,en,cosine_spearman,0.7574469254486307
|
evaluation/mteb/SICK-R.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"cos_sim": {
|
| 6 |
+
"pearson": 0.7729330379162072,
|
| 7 |
+
"spearman": 0.6722953551111448
|
| 8 |
+
},
|
| 9 |
+
"euclidean": {
|
| 10 |
+
"pearson": 0.7144682700059415,
|
| 11 |
+
"spearman": 0.6633178012153248
|
| 12 |
+
},
|
| 13 |
+
"evaluation_time": 52.38,
|
| 14 |
+
"manhattan": {
|
| 15 |
+
"pearson": 0.7146941734657887,
|
| 16 |
+
"spearman": 0.6643234359835815
|
| 17 |
+
}
|
| 18 |
+
}
|
| 19 |
+
}
|
evaluation/mteb/STS12.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"cos_sim": {
|
| 6 |
+
"pearson": 0.7540943196466576,
|
| 7 |
+
"spearman": 0.6659241013465915
|
| 8 |
+
},
|
| 9 |
+
"euclidean": {
|
| 10 |
+
"pearson": 0.7132500540796616,
|
| 11 |
+
"spearman": 0.6786667467202591
|
| 12 |
+
},
|
| 13 |
+
"evaluation_time": 26.18,
|
| 14 |
+
"manhattan": {
|
| 15 |
+
"pearson": 0.7148209832089134,
|
| 16 |
+
"spearman": 0.6794511626964879
|
| 17 |
+
}
|
| 18 |
+
}
|
| 19 |
+
}
|
evaluation/mteb/STS13.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"dataset_version": null,
|
| 3 |
+
"mteb_version": "0.0.2",
|
| 4 |
+
"test": {
|
| 5 |
+
"cos_sim": {
|
| 6 |
+
"pearson": 0.7708302398877518,
|
| 7 |
+
"spearman": 0.7733151317062642
|
| 8 |
+
},
|
| 9 |
+
"euclidean": {
|
| 10 |
+
"pearson": 0.7677020279715008,
|
| 11 |
+
"spearman": 0.7713893776083225
|
| 12 |
+
},
|
| 13 |
+
"evaluation_time": 12.09,
|
| 14 |
+
"manhattan": {
|
| 15 |
+
"pearson": 0.7676732290707478,
|
| 16 |
+
"spearman": 0.7714500877396631
|
| 17 |
+
}
|
| 18 |
+
}
|
| 19 |
+
}
|