Spaces:
AIR-Bench
/
Restarting on CPU Upgrade

leaderboard / tests /toydata /test_data.json
nan's picture
feat: adapt the data loading part
8b7a945
raw
history blame
1.86 kB
[
{
"config": {
"retrieval_model": "bge-m3",
"reranking_model": "bge-reranker-v2-m3",
"task": "long_doc",
"metric": "ndcg_at_1"
},
"results": [
{
"domain": "law",
"lang": "en",
"dataset": "lex_files_500K-600K",
"value": 0.75723
}
]
},
{
"config": {
"retrieval_model": "bge-m3",
"reranking_model": "bge-reranker-v2-m3",
"task": "long_doc",
"metric": "ndcg_at_3"
},
"results": [
{
"domain": "law",
"lang": "en",
"dataset": "lex_files_500K-600K",
"value": 0.69909
}
]
},
{
"config": {
"retrieval_model": "bge-m3",
"reranking_model": "bge-reranker-v2-m3",
"task": "qa",
"metric": "ndcg_at_1"
},
"results": [
{
"domain": "wiki",
"lang": "en",
"dataset": "unknown",
"value": 0.69083
}
]
},
{
"config": {
"retrieval_model": "bge-m3",
"reranking_model": "bge-reranker-v2-m3",
"task": "qa",
"metric": "ndcg_at_3"
},
"results": [
{
"domain": "wiki",
"lang": "en",
"dataset": "unknown",
"value": 0.73359
}
]
},
{
"config": {
"retrieval_model": "bge-m3",
"reranking_model": "bge-reranker-v2-m3",
"task": "qa",
"metric": "ndcg_at_1"
},
"results": [
{
"domain": "wiki",
"lang": "zh",
"dataset": "unknown",
"value": 0.78358
}
]
},
{
"config": {
"retrieval_model": "bge-m3",
"reranking_model": "bge-reranker-v2-m3",
"task": "qa",
"metric": "ndcg_at_3"
},
"results": [
{
"domain": "wiki",
"lang": "zh",
"dataset": "unknown",
"value": 0.78358
}
]
}
]