Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add MTEB retrieval results for spice #100

Closed
wants to merge 3 commits into from
Closed
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -0,0 +1,158 @@
{
"dataset_revision": "c22ab2a51041ffd869aaddef7af8d8215647e41a",
"task_name": "ArguAna",
"mteb_version": "1.29.16",
"scores": {
"test": [
{
"ndcg_at_1": 0.49075,
"ndcg_at_3": 0.66383,
"ndcg_at_5": 0.70342,
"ndcg_at_10": 0.72962,
"ndcg_at_20": 0.73723,
"ndcg_at_100": 0.73826,
"ndcg_at_1000": 0.73826,
"map_at_1": 0.49075,
"map_at_3": 0.62138,
"map_at_5": 0.64354,
"map_at_10": 0.65446,
"map_at_20": 0.65668,
"map_at_100": 0.65687,
"map_at_1000": 0.65687,
"recall_at_1": 0.49075,
"recall_at_3": 0.78663,
"recall_at_5": 0.88193,
"recall_at_10": 0.9623,
"recall_at_20": 0.99147,
"recall_at_100": 0.99644,
"recall_at_1000": 0.99644,
"precision_at_1": 0.49075,
"precision_at_3": 0.26221,
"precision_at_5": 0.17639,
"precision_at_10": 0.09623,
"precision_at_20": 0.04957,
"precision_at_100": 0.00996,
"precision_at_1000": 0.001,
"mrr_at_1": 0.502845,
"mrr_at_3": 0.625889,
"mrr_at_5": 0.647653,
"mrr_at_10": 0.658818,
"mrr_at_20": 0.661072,
"mrr_at_100": 0.661224,
"mrr_at_1000": 0.661224,
"nauc_ndcg_at_1_max": -0.208769,
"nauc_ndcg_at_1_std": -0.198636,
"nauc_ndcg_at_1_diff1": 0.188698,
"nauc_ndcg_at_3_max": -0.161218,
"nauc_ndcg_at_3_std": -0.243332,
"nauc_ndcg_at_3_diff1": 0.18716,
"nauc_ndcg_at_5_max": -0.171036,
"nauc_ndcg_at_5_std": -0.243718,
"nauc_ndcg_at_5_diff1": 0.18497,
"nauc_ndcg_at_10_max": -0.189436,
"nauc_ndcg_at_10_std": -0.236004,
"nauc_ndcg_at_10_diff1": 0.172084,
"nauc_ndcg_at_20_max": -0.187444,
"nauc_ndcg_at_20_std": -0.227386,
"nauc_ndcg_at_20_diff1": 0.176302,
"nauc_ndcg_at_100_max": -0.187249,
"nauc_ndcg_at_100_std": -0.224865,
"nauc_ndcg_at_100_diff1": 0.177688,
"nauc_ndcg_at_1000_max": -0.187249,
"nauc_ndcg_at_1000_std": -0.224865,
"nauc_ndcg_at_1000_diff1": 0.177688,
"nauc_map_at_1_max": -0.208769,
"nauc_map_at_1_std": -0.198636,
"nauc_map_at_1_diff1": 0.188698,
"nauc_map_at_3_max": -0.179356,
"nauc_map_at_3_std": -0.23088,
"nauc_map_at_3_diff1": 0.183242,
"nauc_map_at_5_max": -0.185777,
"nauc_map_at_5_std": -0.230461,
"nauc_map_at_5_diff1": 0.181223,
"nauc_map_at_10_max": -0.192355,
"nauc_map_at_10_std": -0.227202,
"nauc_map_at_10_diff1": 0.17675,
"nauc_map_at_20_max": -0.191791,
"nauc_map_at_20_std": -0.225115,
"nauc_map_at_20_diff1": 0.177727,
"nauc_map_at_100_max": -0.191676,
"nauc_map_at_100_std": -0.224732,
"nauc_map_at_100_diff1": 0.178022,
"nauc_map_at_1000_max": -0.191676,
"nauc_map_at_1000_std": -0.224732,
"nauc_map_at_1000_diff1": 0.178022,
"nauc_recall_at_1_max": -0.208769,
"nauc_recall_at_1_std": -0.198636,
"nauc_recall_at_1_diff1": 0.188698,
"nauc_recall_at_3_max": -0.082619,
"nauc_recall_at_3_std": -0.295139,
"nauc_recall_at_3_diff1": 0.20624,
"nauc_recall_at_5_max": -0.070538,
"nauc_recall_at_5_std": -0.330609,
"nauc_recall_at_5_diff1": 0.215717,
"nauc_recall_at_10_max": -0.173445,
"nauc_recall_at_10_std": -0.38724,
"nauc_recall_at_10_diff1": 0.066196,
"nauc_recall_at_20_max": 0.023336,
"nauc_recall_at_20_std": -0.161168,
"nauc_recall_at_20_diff1": 0.077338,
"nauc_recall_at_100_max": 0.297733,
"nauc_recall_at_100_std": 0.581765,
"nauc_recall_at_100_diff1": 0.224523,
"nauc_recall_at_1000_max": 0.297733,
"nauc_recall_at_1000_std": 0.581765,
"nauc_recall_at_1000_diff1": 0.224523,
"nauc_precision_at_1_max": -0.208769,
"nauc_precision_at_1_std": -0.198636,
"nauc_precision_at_1_diff1": 0.188698,
"nauc_precision_at_3_max": -0.082619,
"nauc_precision_at_3_std": -0.295139,
"nauc_precision_at_3_diff1": 0.20624,
"nauc_precision_at_5_max": -0.070538,
"nauc_precision_at_5_std": -0.330609,
"nauc_precision_at_5_diff1": 0.215717,
"nauc_precision_at_10_max": -0.173445,
"nauc_precision_at_10_std": -0.38724,
"nauc_precision_at_10_diff1": 0.066196,
"nauc_precision_at_20_max": 0.023336,
"nauc_precision_at_20_std": -0.161168,
"nauc_precision_at_20_diff1": 0.077338,
"nauc_precision_at_100_max": 0.297733,
"nauc_precision_at_100_std": 0.581765,
"nauc_precision_at_100_diff1": 0.224523,
"nauc_precision_at_1000_max": 0.297733,
"nauc_precision_at_1000_std": 0.581765,
"nauc_precision_at_1000_diff1": 0.224523,
"nauc_mrr_at_1_max": -0.220839,
"nauc_mrr_at_1_std": -0.201151,
"nauc_mrr_at_1_diff1": 0.15525,
"nauc_mrr_at_3_max": -0.208131,
"nauc_mrr_at_3_std": -0.232962,
"nauc_mrr_at_3_diff1": 0.139187,
"nauc_mrr_at_5_max": -0.211804,
"nauc_mrr_at_5_std": -0.234365,
"nauc_mrr_at_5_diff1": 0.139401,
"nauc_mrr_at_10_max": -0.218112,
"nauc_mrr_at_10_std": -0.230586,
"nauc_mrr_at_10_diff1": 0.134302,
"nauc_mrr_at_20_max": -0.217739,
"nauc_mrr_at_20_std": -0.228308,
"nauc_mrr_at_20_diff1": 0.134898,
"nauc_mrr_at_100_max": -0.217698,
"nauc_mrr_at_100_std": -0.228138,
"nauc_mrr_at_100_diff1": 0.135108,
"nauc_mrr_at_1000_max": -0.217698,
"nauc_mrr_at_1000_std": -0.228138,
"nauc_mrr_at_1000_diff1": 0.135108,
"main_score": 0.72962,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 18.87188196182251,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,158 @@
{
"dataset_revision": "f46a197baaae43b4f621051089b82a364682dfeb",
"task_name": "CQADupstackAndroidRetrieval",
"mteb_version": "1.29.16",
"scores": {
"test": [
{
"ndcg_at_1": 0.55365,
"ndcg_at_3": 0.63057,
"ndcg_at_5": 0.6606,
"ndcg_at_10": 0.69708,
"ndcg_at_20": 0.71744,
"ndcg_at_100": 0.73414,
"ndcg_at_1000": 0.73796,
"map_at_1": 0.46084,
"map_at_3": 0.56928,
"map_at_5": 0.59722,
"map_at_10": 0.62033,
"map_at_20": 0.63071,
"map_at_100": 0.6364,
"map_at_1000": 0.63705,
"recall_at_1": 0.46084,
"recall_at_3": 0.6634,
"recall_at_5": 0.7434,
"recall_at_10": 0.85066,
"recall_at_20": 0.91971,
"recall_at_100": 0.98225,
"recall_at_1000": 0.99758,
"precision_at_1": 0.55365,
"precision_at_3": 0.29948,
"precision_at_5": 0.21631,
"precision_at_10": 0.13348,
"precision_at_20": 0.07761,
"precision_at_100": 0.01887,
"precision_at_1000": 0.00217,
"mrr_at_1": 0.553648,
"mrr_at_3": 0.647592,
"mrr_at_5": 0.664688,
"mrr_at_10": 0.676074,
"mrr_at_20": 0.678968,
"mrr_at_100": 0.679913,
"mrr_at_1000": 0.679942,
"nauc_ndcg_at_1_max": 0.422592,
"nauc_ndcg_at_1_std": -0.19572,
"nauc_ndcg_at_1_diff1": 0.618884,
"nauc_ndcg_at_3_max": 0.350547,
"nauc_ndcg_at_3_std": -0.302969,
"nauc_ndcg_at_3_diff1": 0.567468,
"nauc_ndcg_at_5_max": 0.344361,
"nauc_ndcg_at_5_std": -0.309362,
"nauc_ndcg_at_5_diff1": 0.56426,
"nauc_ndcg_at_10_max": 0.350474,
"nauc_ndcg_at_10_std": -0.298407,
"nauc_ndcg_at_10_diff1": 0.569679,
"nauc_ndcg_at_20_max": 0.358757,
"nauc_ndcg_at_20_std": -0.290873,
"nauc_ndcg_at_20_diff1": 0.582582,
"nauc_ndcg_at_100_max": 0.370705,
"nauc_ndcg_at_100_std": -0.261245,
"nauc_ndcg_at_100_diff1": 0.58523,
"nauc_ndcg_at_1000_max": 0.370663,
"nauc_ndcg_at_1000_std": -0.260075,
"nauc_ndcg_at_1000_diff1": 0.585985,
"nauc_map_at_1_max": 0.334696,
"nauc_map_at_1_std": -0.216782,
"nauc_map_at_1_diff1": 0.634936,
"nauc_map_at_3_max": 0.341146,
"nauc_map_at_3_std": -0.292058,
"nauc_map_at_3_diff1": 0.583905,
"nauc_map_at_5_max": 0.350347,
"nauc_map_at_5_std": -0.28942,
"nauc_map_at_5_diff1": 0.579374,
"nauc_map_at_10_max": 0.357238,
"nauc_map_at_10_std": -0.282125,
"nauc_map_at_10_diff1": 0.582397,
"nauc_map_at_20_max": 0.362272,
"nauc_map_at_20_std": -0.273168,
"nauc_map_at_20_diff1": 0.585054,
"nauc_map_at_100_max": 0.364513,
"nauc_map_at_100_std": -0.265953,
"nauc_map_at_100_diff1": 0.584994,
"nauc_map_at_1000_max": 0.364229,
"nauc_map_at_1000_std": -0.266099,
"nauc_map_at_1000_diff1": 0.584968,
"nauc_recall_at_1_max": 0.334696,
"nauc_recall_at_1_std": -0.216782,
"nauc_recall_at_1_diff1": 0.634936,
"nauc_recall_at_3_max": 0.272711,
"nauc_recall_at_3_std": -0.394759,
"nauc_recall_at_3_diff1": 0.508777,
"nauc_recall_at_5_max": 0.248243,
"nauc_recall_at_5_std": -0.423965,
"nauc_recall_at_5_diff1": 0.481199,
"nauc_recall_at_10_max": 0.21494,
"nauc_recall_at_10_std": -0.438422,
"nauc_recall_at_10_diff1": 0.448873,
"nauc_recall_at_20_max": 0.165958,
"nauc_recall_at_20_std": -0.520014,
"nauc_recall_at_20_diff1": 0.463587,
"nauc_recall_at_100_max": 0.29364,
"nauc_recall_at_100_std": -0.172103,
"nauc_recall_at_100_diff1": 0.383,
"nauc_recall_at_1000_max": 0.61684,
"nauc_recall_at_1000_std": 0.34679,
"nauc_recall_at_1000_diff1": 0.627576,
"nauc_precision_at_1_max": 0.422592,
"nauc_precision_at_1_std": -0.19572,
"nauc_precision_at_1_diff1": 0.618884,
"nauc_precision_at_3_max": 0.233391,
"nauc_precision_at_3_std": -0.163685,
"nauc_precision_at_3_diff1": 0.16895,
"nauc_precision_at_5_max": 0.140338,
"nauc_precision_at_5_std": -0.048204,
"nauc_precision_at_5_diff1": 0.002574,
"nauc_precision_at_10_max": 0.043931,
"nauc_precision_at_10_std": 0.08571,
"nauc_precision_at_10_diff1": -0.139889,
"nauc_precision_at_20_max": -0.008687,
"nauc_precision_at_20_std": 0.17433,
"nauc_precision_at_20_diff1": -0.201591,
"nauc_precision_at_100_max": -0.088065,
"nauc_precision_at_100_std": 0.201744,
"nauc_precision_at_100_diff1": -0.261524,
"nauc_precision_at_1000_max": -0.168536,
"nauc_precision_at_1000_std": 0.096805,
"nauc_precision_at_1000_diff1": -0.295068,
"nauc_mrr_at_1_max": 0.422592,
"nauc_mrr_at_1_std": -0.19572,
"nauc_mrr_at_1_diff1": 0.618884,
"nauc_mrr_at_3_max": 0.395577,
"nauc_mrr_at_3_std": -0.262852,
"nauc_mrr_at_3_diff1": 0.599129,
"nauc_mrr_at_5_max": 0.393361,
"nauc_mrr_at_5_std": -0.264697,
"nauc_mrr_at_5_diff1": 0.599879,
"nauc_mrr_at_10_max": 0.395371,
"nauc_mrr_at_10_std": -0.256368,
"nauc_mrr_at_10_diff1": 0.600975,
"nauc_mrr_at_20_max": 0.395465,
"nauc_mrr_at_20_std": -0.256893,
"nauc_mrr_at_20_diff1": 0.602712,
"nauc_mrr_at_100_max": 0.396742,
"nauc_mrr_at_100_std": -0.254594,
"nauc_mrr_at_100_diff1": 0.602411,
"nauc_mrr_at_1000_max": 0.396739,
"nauc_mrr_at_1000_std": -0.254588,
"nauc_mrr_at_1000_diff1": 0.602419,
"main_score": 0.69708,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 23.853569507598877,
"kg_co2_emissions": null
}
Loading
Loading