diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/ArguAna.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/ArguAna.json new file mode 100644 index 000000000..094738976 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/ArguAna.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "c22ab2a51041ffd869aaddef7af8d8215647e41a", + "task_name": "ArguAna", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.49075, + "ndcg_at_3": 0.66383, + "ndcg_at_5": 0.70342, + "ndcg_at_10": 0.72962, + "ndcg_at_20": 0.73723, + "ndcg_at_100": 0.73826, + "ndcg_at_1000": 0.73826, + "map_at_1": 0.49075, + "map_at_3": 0.62138, + "map_at_5": 0.64354, + "map_at_10": 0.65446, + "map_at_20": 0.65668, + "map_at_100": 0.65687, + "map_at_1000": 0.65687, + "recall_at_1": 0.49075, + "recall_at_3": 0.78663, + "recall_at_5": 0.88193, + "recall_at_10": 0.9623, + "recall_at_20": 0.99147, + "recall_at_100": 0.99644, + "recall_at_1000": 0.99644, + "precision_at_1": 0.49075, + "precision_at_3": 0.26221, + "precision_at_5": 0.17639, + "precision_at_10": 0.09623, + "precision_at_20": 0.04957, + "precision_at_100": 0.00996, + "precision_at_1000": 0.001, + "mrr_at_1": 0.502845, + "mrr_at_3": 0.625889, + "mrr_at_5": 0.647653, + "mrr_at_10": 0.658818, + "mrr_at_20": 0.661072, + "mrr_at_100": 0.661224, + "mrr_at_1000": 0.661224, + "nauc_ndcg_at_1_max": -0.208769, + "nauc_ndcg_at_1_std": -0.198636, + "nauc_ndcg_at_1_diff1": 0.188698, + "nauc_ndcg_at_3_max": -0.161218, + "nauc_ndcg_at_3_std": -0.243332, + "nauc_ndcg_at_3_diff1": 0.18716, + "nauc_ndcg_at_5_max": -0.171036, + "nauc_ndcg_at_5_std": -0.243718, + "nauc_ndcg_at_5_diff1": 0.18497, + "nauc_ndcg_at_10_max": -0.189436, + "nauc_ndcg_at_10_std": -0.236004, + "nauc_ndcg_at_10_diff1": 0.172084, + "nauc_ndcg_at_20_max": -0.187444, + "nauc_ndcg_at_20_std": -0.227386, + "nauc_ndcg_at_20_diff1": 0.176302, + "nauc_ndcg_at_100_max": -0.187249, + "nauc_ndcg_at_100_std": -0.224865, + "nauc_ndcg_at_100_diff1": 0.177688, + "nauc_ndcg_at_1000_max": -0.187249, + "nauc_ndcg_at_1000_std": -0.224865, + "nauc_ndcg_at_1000_diff1": 0.177688, + "nauc_map_at_1_max": -0.208769, + "nauc_map_at_1_std": -0.198636, + "nauc_map_at_1_diff1": 0.188698, + "nauc_map_at_3_max": -0.179356, + "nauc_map_at_3_std": -0.23088, + "nauc_map_at_3_diff1": 0.183242, + "nauc_map_at_5_max": -0.185777, + "nauc_map_at_5_std": -0.230461, + "nauc_map_at_5_diff1": 0.181223, + "nauc_map_at_10_max": -0.192355, + "nauc_map_at_10_std": -0.227202, + "nauc_map_at_10_diff1": 0.17675, + "nauc_map_at_20_max": -0.191791, + "nauc_map_at_20_std": -0.225115, + "nauc_map_at_20_diff1": 0.177727, + "nauc_map_at_100_max": -0.191676, + "nauc_map_at_100_std": -0.224732, + "nauc_map_at_100_diff1": 0.178022, + "nauc_map_at_1000_max": -0.191676, + "nauc_map_at_1000_std": -0.224732, + "nauc_map_at_1000_diff1": 0.178022, + "nauc_recall_at_1_max": -0.208769, + "nauc_recall_at_1_std": -0.198636, + "nauc_recall_at_1_diff1": 0.188698, + "nauc_recall_at_3_max": -0.082619, + "nauc_recall_at_3_std": -0.295139, + "nauc_recall_at_3_diff1": 0.20624, + "nauc_recall_at_5_max": -0.070538, + "nauc_recall_at_5_std": -0.330609, + "nauc_recall_at_5_diff1": 0.215717, + "nauc_recall_at_10_max": -0.173445, + "nauc_recall_at_10_std": -0.38724, + "nauc_recall_at_10_diff1": 0.066196, + "nauc_recall_at_20_max": 0.023336, + "nauc_recall_at_20_std": -0.161168, + "nauc_recall_at_20_diff1": 0.077338, + "nauc_recall_at_100_max": 0.297733, + "nauc_recall_at_100_std": 0.581765, + "nauc_recall_at_100_diff1": 0.224523, + "nauc_recall_at_1000_max": 0.297733, + "nauc_recall_at_1000_std": 0.581765, + "nauc_recall_at_1000_diff1": 0.224523, + "nauc_precision_at_1_max": -0.208769, + "nauc_precision_at_1_std": -0.198636, + "nauc_precision_at_1_diff1": 0.188698, + "nauc_precision_at_3_max": -0.082619, + "nauc_precision_at_3_std": -0.295139, + "nauc_precision_at_3_diff1": 0.20624, + "nauc_precision_at_5_max": -0.070538, + "nauc_precision_at_5_std": -0.330609, + "nauc_precision_at_5_diff1": 0.215717, + "nauc_precision_at_10_max": -0.173445, + "nauc_precision_at_10_std": -0.38724, + "nauc_precision_at_10_diff1": 0.066196, + "nauc_precision_at_20_max": 0.023336, + "nauc_precision_at_20_std": -0.161168, + "nauc_precision_at_20_diff1": 0.077338, + "nauc_precision_at_100_max": 0.297733, + "nauc_precision_at_100_std": 0.581765, + "nauc_precision_at_100_diff1": 0.224523, + "nauc_precision_at_1000_max": 0.297733, + "nauc_precision_at_1000_std": 0.581765, + "nauc_precision_at_1000_diff1": 0.224523, + "nauc_mrr_at_1_max": -0.220839, + "nauc_mrr_at_1_std": -0.201151, + "nauc_mrr_at_1_diff1": 0.15525, + "nauc_mrr_at_3_max": -0.208131, + "nauc_mrr_at_3_std": -0.232962, + "nauc_mrr_at_3_diff1": 0.139187, + "nauc_mrr_at_5_max": -0.211804, + "nauc_mrr_at_5_std": -0.234365, + "nauc_mrr_at_5_diff1": 0.139401, + "nauc_mrr_at_10_max": -0.218112, + "nauc_mrr_at_10_std": -0.230586, + "nauc_mrr_at_10_diff1": 0.134302, + "nauc_mrr_at_20_max": -0.217739, + "nauc_mrr_at_20_std": -0.228308, + "nauc_mrr_at_20_diff1": 0.134898, + "nauc_mrr_at_100_max": -0.217698, + "nauc_mrr_at_100_std": -0.228138, + "nauc_mrr_at_100_diff1": 0.135108, + "nauc_mrr_at_1000_max": -0.217698, + "nauc_mrr_at_1000_std": -0.228138, + "nauc_mrr_at_1000_diff1": 0.135108, + "main_score": 0.72962, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 18.87188196182251, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackAndroidRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackAndroidRetrieval.json new file mode 100644 index 000000000..a39977475 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackAndroidRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "f46a197baaae43b4f621051089b82a364682dfeb", + "task_name": "CQADupstackAndroidRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.55365, + "ndcg_at_3": 0.63057, + "ndcg_at_5": 0.6606, + "ndcg_at_10": 0.69708, + "ndcg_at_20": 0.71744, + "ndcg_at_100": 0.73414, + "ndcg_at_1000": 0.73796, + "map_at_1": 0.46084, + "map_at_3": 0.56928, + "map_at_5": 0.59722, + "map_at_10": 0.62033, + "map_at_20": 0.63071, + "map_at_100": 0.6364, + "map_at_1000": 0.63705, + "recall_at_1": 0.46084, + "recall_at_3": 0.6634, + "recall_at_5": 0.7434, + "recall_at_10": 0.85066, + "recall_at_20": 0.91971, + "recall_at_100": 0.98225, + "recall_at_1000": 0.99758, + "precision_at_1": 0.55365, + "precision_at_3": 0.29948, + "precision_at_5": 0.21631, + "precision_at_10": 0.13348, + "precision_at_20": 0.07761, + "precision_at_100": 0.01887, + "precision_at_1000": 0.00217, + "mrr_at_1": 0.553648, + "mrr_at_3": 0.647592, + "mrr_at_5": 0.664688, + "mrr_at_10": 0.676074, + "mrr_at_20": 0.678968, + "mrr_at_100": 0.679913, + "mrr_at_1000": 0.679942, + "nauc_ndcg_at_1_max": 0.422592, + "nauc_ndcg_at_1_std": -0.19572, + "nauc_ndcg_at_1_diff1": 0.618884, + "nauc_ndcg_at_3_max": 0.350547, + "nauc_ndcg_at_3_std": -0.302969, + "nauc_ndcg_at_3_diff1": 0.567468, + "nauc_ndcg_at_5_max": 0.344361, + "nauc_ndcg_at_5_std": -0.309362, + "nauc_ndcg_at_5_diff1": 0.56426, + "nauc_ndcg_at_10_max": 0.350474, + "nauc_ndcg_at_10_std": -0.298407, + "nauc_ndcg_at_10_diff1": 0.569679, + "nauc_ndcg_at_20_max": 0.358757, + "nauc_ndcg_at_20_std": -0.290873, + "nauc_ndcg_at_20_diff1": 0.582582, + "nauc_ndcg_at_100_max": 0.370705, + "nauc_ndcg_at_100_std": -0.261245, + "nauc_ndcg_at_100_diff1": 0.58523, + "nauc_ndcg_at_1000_max": 0.370663, + "nauc_ndcg_at_1000_std": -0.260075, + "nauc_ndcg_at_1000_diff1": 0.585985, + "nauc_map_at_1_max": 0.334696, + "nauc_map_at_1_std": -0.216782, + "nauc_map_at_1_diff1": 0.634936, + "nauc_map_at_3_max": 0.341146, + "nauc_map_at_3_std": -0.292058, + "nauc_map_at_3_diff1": 0.583905, + "nauc_map_at_5_max": 0.350347, + "nauc_map_at_5_std": -0.28942, + "nauc_map_at_5_diff1": 0.579374, + "nauc_map_at_10_max": 0.357238, + "nauc_map_at_10_std": -0.282125, + "nauc_map_at_10_diff1": 0.582397, + "nauc_map_at_20_max": 0.362272, + "nauc_map_at_20_std": -0.273168, + "nauc_map_at_20_diff1": 0.585054, + "nauc_map_at_100_max": 0.364513, + "nauc_map_at_100_std": -0.265953, + "nauc_map_at_100_diff1": 0.584994, + "nauc_map_at_1000_max": 0.364229, + "nauc_map_at_1000_std": -0.266099, + "nauc_map_at_1000_diff1": 0.584968, + "nauc_recall_at_1_max": 0.334696, + "nauc_recall_at_1_std": -0.216782, + "nauc_recall_at_1_diff1": 0.634936, + "nauc_recall_at_3_max": 0.272711, + "nauc_recall_at_3_std": -0.394759, + "nauc_recall_at_3_diff1": 0.508777, + "nauc_recall_at_5_max": 0.248243, + "nauc_recall_at_5_std": -0.423965, + "nauc_recall_at_5_diff1": 0.481199, + "nauc_recall_at_10_max": 0.21494, + "nauc_recall_at_10_std": -0.438422, + "nauc_recall_at_10_diff1": 0.448873, + "nauc_recall_at_20_max": 0.165958, + "nauc_recall_at_20_std": -0.520014, + "nauc_recall_at_20_diff1": 0.463587, + "nauc_recall_at_100_max": 0.29364, + "nauc_recall_at_100_std": -0.172103, + "nauc_recall_at_100_diff1": 0.383, + "nauc_recall_at_1000_max": 0.61684, + "nauc_recall_at_1000_std": 0.34679, + "nauc_recall_at_1000_diff1": 0.627576, + "nauc_precision_at_1_max": 0.422592, + "nauc_precision_at_1_std": -0.19572, + "nauc_precision_at_1_diff1": 0.618884, + "nauc_precision_at_3_max": 0.233391, + "nauc_precision_at_3_std": -0.163685, + "nauc_precision_at_3_diff1": 0.16895, + "nauc_precision_at_5_max": 0.140338, + "nauc_precision_at_5_std": -0.048204, + "nauc_precision_at_5_diff1": 0.002574, + "nauc_precision_at_10_max": 0.043931, + "nauc_precision_at_10_std": 0.08571, + "nauc_precision_at_10_diff1": -0.139889, + "nauc_precision_at_20_max": -0.008687, + "nauc_precision_at_20_std": 0.17433, + "nauc_precision_at_20_diff1": -0.201591, + "nauc_precision_at_100_max": -0.088065, + "nauc_precision_at_100_std": 0.201744, + "nauc_precision_at_100_diff1": -0.261524, + "nauc_precision_at_1000_max": -0.168536, + "nauc_precision_at_1000_std": 0.096805, + "nauc_precision_at_1000_diff1": -0.295068, + "nauc_mrr_at_1_max": 0.422592, + "nauc_mrr_at_1_std": -0.19572, + "nauc_mrr_at_1_diff1": 0.618884, + "nauc_mrr_at_3_max": 0.395577, + "nauc_mrr_at_3_std": -0.262852, + "nauc_mrr_at_3_diff1": 0.599129, + "nauc_mrr_at_5_max": 0.393361, + "nauc_mrr_at_5_std": -0.264697, + "nauc_mrr_at_5_diff1": 0.599879, + "nauc_mrr_at_10_max": 0.395371, + "nauc_mrr_at_10_std": -0.256368, + "nauc_mrr_at_10_diff1": 0.600975, + "nauc_mrr_at_20_max": 0.395465, + "nauc_mrr_at_20_std": -0.256893, + "nauc_mrr_at_20_diff1": 0.602712, + "nauc_mrr_at_100_max": 0.396742, + "nauc_mrr_at_100_std": -0.254594, + "nauc_mrr_at_100_diff1": 0.602411, + "nauc_mrr_at_1000_max": 0.396739, + "nauc_mrr_at_1000_std": -0.254588, + "nauc_mrr_at_1000_diff1": 0.602419, + "main_score": 0.69708, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 23.853569507598877, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackEnglishRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackEnglishRetrieval.json new file mode 100644 index 000000000..30721c719 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackEnglishRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "ad9991cb51e31e31e430383c75ffb2885547b5f0", + "task_name": "CQADupstackEnglishRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.58535, + "ndcg_at_3": 0.66319, + "ndcg_at_5": 0.69091, + "ndcg_at_10": 0.72224, + "ndcg_at_20": 0.73965, + "ndcg_at_100": 0.7531, + "ndcg_at_1000": 0.75832, + "map_at_1": 0.47624, + "map_at_3": 0.59966, + "map_at_5": 0.62462, + "map_at_10": 0.64625, + "map_at_20": 0.65539, + "map_at_100": 0.66075, + "map_at_1000": 0.66158, + "recall_at_1": 0.47624, + "recall_at_3": 0.6992, + "recall_at_5": 0.77549, + "recall_at_10": 0.86624, + "recall_at_20": 0.92454, + "recall_at_100": 0.97427, + "recall_at_1000": 0.99277, + "precision_at_1": 0.58535, + "precision_at_3": 0.32166, + "precision_at_5": 0.22599, + "precision_at_10": 0.13713, + "precision_at_20": 0.07904, + "precision_at_100": 0.01925, + "precision_at_1000": 0.00222, + "mrr_at_1": 0.58535, + "mrr_at_3": 0.679618, + "mrr_at_5": 0.695255, + "mrr_at_10": 0.704839, + "mrr_at_20": 0.707685, + "mrr_at_100": 0.708376, + "mrr_at_1000": 0.70838, + "nauc_ndcg_at_1_max": 0.383089, + "nauc_ndcg_at_1_std": -0.126909, + "nauc_ndcg_at_1_diff1": 0.58578, + "nauc_ndcg_at_3_max": 0.372876, + "nauc_ndcg_at_3_std": -0.17427, + "nauc_ndcg_at_3_diff1": 0.547567, + "nauc_ndcg_at_5_max": 0.378316, + "nauc_ndcg_at_5_std": -0.167885, + "nauc_ndcg_at_5_diff1": 0.558766, + "nauc_ndcg_at_10_max": 0.381842, + "nauc_ndcg_at_10_std": -0.165728, + "nauc_ndcg_at_10_diff1": 0.562349, + "nauc_ndcg_at_20_max": 0.385685, + "nauc_ndcg_at_20_std": -0.152507, + "nauc_ndcg_at_20_diff1": 0.566075, + "nauc_ndcg_at_100_max": 0.384251, + "nauc_ndcg_at_100_std": -0.142081, + "nauc_ndcg_at_100_diff1": 0.561551, + "nauc_ndcg_at_1000_max": 0.382494, + "nauc_ndcg_at_1000_std": -0.13881, + "nauc_ndcg_at_1000_diff1": 0.559643, + "nauc_map_at_1_max": 0.274788, + "nauc_map_at_1_std": -0.19611, + "nauc_map_at_1_diff1": 0.592439, + "nauc_map_at_3_max": 0.327272, + "nauc_map_at_3_std": -0.218318, + "nauc_map_at_3_diff1": 0.569733, + "nauc_map_at_5_max": 0.343323, + "nauc_map_at_5_std": -0.205513, + "nauc_map_at_5_diff1": 0.572952, + "nauc_map_at_10_max": 0.353871, + "nauc_map_at_10_std": -0.192389, + "nauc_map_at_10_diff1": 0.572092, + "nauc_map_at_20_max": 0.360572, + "nauc_map_at_20_std": -0.178373, + "nauc_map_at_20_diff1": 0.570262, + "nauc_map_at_100_max": 0.364464, + "nauc_map_at_100_std": -0.167724, + "nauc_map_at_100_diff1": 0.566786, + "nauc_map_at_1000_max": 0.364626, + "nauc_map_at_1000_std": -0.166057, + "nauc_map_at_1000_diff1": 0.56646, + "nauc_recall_at_1_max": 0.274788, + "nauc_recall_at_1_std": -0.19611, + "nauc_recall_at_1_diff1": 0.592439, + "nauc_recall_at_3_max": 0.302654, + "nauc_recall_at_3_std": -0.261451, + "nauc_recall_at_3_diff1": 0.505101, + "nauc_recall_at_5_max": 0.327025, + "nauc_recall_at_5_std": -0.230717, + "nauc_recall_at_5_diff1": 0.50679, + "nauc_recall_at_10_max": 0.342029, + "nauc_recall_at_10_std": -0.242381, + "nauc_recall_at_10_diff1": 0.494372, + "nauc_recall_at_20_max": 0.369285, + "nauc_recall_at_20_std": -0.185885, + "nauc_recall_at_20_diff1": 0.5057, + "nauc_recall_at_100_max": 0.413247, + "nauc_recall_at_100_std": -0.008846, + "nauc_recall_at_100_diff1": 0.460503, + "nauc_recall_at_1000_max": 0.462133, + "nauc_recall_at_1000_std": 0.116651, + "nauc_recall_at_1000_diff1": 0.386658, + "nauc_precision_at_1_max": 0.383089, + "nauc_precision_at_1_std": -0.126909, + "nauc_precision_at_1_diff1": 0.58578, + "nauc_precision_at_3_max": 0.286936, + "nauc_precision_at_3_std": -0.001582, + "nauc_precision_at_3_diff1": 0.132702, + "nauc_precision_at_5_max": 0.235334, + "nauc_precision_at_5_std": 0.111857, + "nauc_precision_at_5_diff1": -0.001052, + "nauc_precision_at_10_max": 0.149699, + "nauc_precision_at_10_std": 0.225928, + "nauc_precision_at_10_diff1": -0.154609, + "nauc_precision_at_20_max": 0.099003, + "nauc_precision_at_20_std": 0.326979, + "nauc_precision_at_20_diff1": -0.244865, + "nauc_precision_at_100_max": 0.02782, + "nauc_precision_at_100_std": 0.387103, + "nauc_precision_at_100_diff1": -0.313831, + "nauc_precision_at_1000_max": -0.02666, + "nauc_precision_at_1000_std": 0.356735, + "nauc_precision_at_1000_diff1": -0.312823, + "nauc_mrr_at_1_max": 0.383089, + "nauc_mrr_at_1_std": -0.126909, + "nauc_mrr_at_1_diff1": 0.58578, + "nauc_mrr_at_3_max": 0.392096, + "nauc_mrr_at_3_std": -0.146533, + "nauc_mrr_at_3_diff1": 0.558167, + "nauc_mrr_at_5_max": 0.399421, + "nauc_mrr_at_5_std": -0.132698, + "nauc_mrr_at_5_diff1": 0.564035, + "nauc_mrr_at_10_max": 0.398463, + "nauc_mrr_at_10_std": -0.132316, + "nauc_mrr_at_10_diff1": 0.564881, + "nauc_mrr_at_20_max": 0.397811, + "nauc_mrr_at_20_std": -0.131735, + "nauc_mrr_at_20_diff1": 0.565786, + "nauc_mrr_at_100_max": 0.397474, + "nauc_mrr_at_100_std": -0.131607, + "nauc_mrr_at_100_diff1": 0.565708, + "nauc_mrr_at_1000_max": 0.397466, + "nauc_mrr_at_1000_std": -0.131623, + "nauc_mrr_at_1000_diff1": 0.565706, + "main_score": 0.72224, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 34.536805868148804, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackGamingRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackGamingRetrieval.json new file mode 100644 index 000000000..94a14f995 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackGamingRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "4885aa143210c98657558c04aaf3dc47cfb54340", + "task_name": "CQADupstackGamingRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.61317, + "ndcg_at_3": 0.70074, + "ndcg_at_5": 0.73005, + "ndcg_at_10": 0.76187, + "ndcg_at_20": 0.77625, + "ndcg_at_100": 0.78339, + "ndcg_at_1000": 0.78412, + "map_at_1": 0.54168, + "map_at_3": 0.65961, + "map_at_5": 0.68264, + "map_at_10": 0.69984, + "map_at_20": 0.70592, + "map_at_100": 0.70784, + "map_at_1000": 0.70794, + "recall_at_1": 0.54168, + "recall_at_3": 0.75543, + "recall_at_5": 0.82757, + "recall_at_10": 0.91715, + "recall_at_20": 0.96757, + "recall_at_100": 0.99685, + "recall_at_1000": 0.99988, + "precision_at_1": 0.61317, + "precision_at_3": 0.31014, + "precision_at_5": 0.21003, + "precision_at_10": 0.12025, + "precision_at_20": 0.0652, + "precision_at_100": 0.01389, + "precision_at_1000": 0.00142, + "mrr_at_1": 0.613166, + "mrr_at_3": 0.700104, + "mrr_at_5": 0.713678, + "mrr_at_10": 0.724371, + "mrr_at_20": 0.726872, + "mrr_at_100": 0.727451, + "mrr_at_1000": 0.727455, + "nauc_ndcg_at_1_max": 0.492292, + "nauc_ndcg_at_1_std": -0.188481, + "nauc_ndcg_at_1_diff1": 0.63895, + "nauc_ndcg_at_3_max": 0.432067, + "nauc_ndcg_at_3_std": -0.283048, + "nauc_ndcg_at_3_diff1": 0.594342, + "nauc_ndcg_at_5_max": 0.437297, + "nauc_ndcg_at_5_std": -0.294965, + "nauc_ndcg_at_5_diff1": 0.603543, + "nauc_ndcg_at_10_max": 0.444657, + "nauc_ndcg_at_10_std": -0.286372, + "nauc_ndcg_at_10_diff1": 0.611574, + "nauc_ndcg_at_20_max": 0.452216, + "nauc_ndcg_at_20_std": -0.26997, + "nauc_ndcg_at_20_diff1": 0.610496, + "nauc_ndcg_at_100_max": 0.456445, + "nauc_ndcg_at_100_std": -0.251439, + "nauc_ndcg_at_100_diff1": 0.611359, + "nauc_ndcg_at_1000_max": 0.458025, + "nauc_ndcg_at_1000_std": -0.25136, + "nauc_ndcg_at_1000_diff1": 0.612799, + "nauc_map_at_1_max": 0.407535, + "nauc_map_at_1_std": -0.186058, + "nauc_map_at_1_diff1": 0.642096, + "nauc_map_at_3_max": 0.431977, + "nauc_map_at_3_std": -0.26648, + "nauc_map_at_3_diff1": 0.608231, + "nauc_map_at_5_max": 0.440427, + "nauc_map_at_5_std": -0.266642, + "nauc_map_at_5_diff1": 0.610442, + "nauc_map_at_10_max": 0.444979, + "nauc_map_at_10_std": -0.259539, + "nauc_map_at_10_diff1": 0.612967, + "nauc_map_at_20_max": 0.449539, + "nauc_map_at_20_std": -0.252611, + "nauc_map_at_20_diff1": 0.613101, + "nauc_map_at_100_max": 0.451301, + "nauc_map_at_100_std": -0.248142, + "nauc_map_at_100_diff1": 0.613169, + "nauc_map_at_1000_max": 0.451525, + "nauc_map_at_1000_std": -0.248162, + "nauc_map_at_1000_diff1": 0.613367, + "nauc_recall_at_1_max": 0.407535, + "nauc_recall_at_1_std": -0.186058, + "nauc_recall_at_1_diff1": 0.642096, + "nauc_recall_at_3_max": 0.355875, + "nauc_recall_at_3_std": -0.380289, + "nauc_recall_at_3_diff1": 0.541901, + "nauc_recall_at_5_max": 0.348461, + "nauc_recall_at_5_std": -0.445271, + "nauc_recall_at_5_diff1": 0.542183, + "nauc_recall_at_10_max": 0.326802, + "nauc_recall_at_10_std": -0.544557, + "nauc_recall_at_10_diff1": 0.556051, + "nauc_recall_at_20_max": 0.326068, + "nauc_recall_at_20_std": -0.6511, + "nauc_recall_at_20_diff1": 0.512828, + "nauc_recall_at_100_max": 0.043244, + "nauc_recall_at_100_std": -0.275468, + "nauc_recall_at_100_diff1": 0.187239, + "nauc_recall_at_1000_max": -0.373278, + "nauc_recall_at_1000_std": 0.143698, + "nauc_recall_at_1000_diff1": -0.283576, + "nauc_precision_at_1_max": 0.492292, + "nauc_precision_at_1_std": -0.188481, + "nauc_precision_at_1_diff1": 0.63895, + "nauc_precision_at_3_max": 0.267722, + "nauc_precision_at_3_std": -0.15659, + "nauc_precision_at_3_diff1": 0.156679, + "nauc_precision_at_5_max": 0.197119, + "nauc_precision_at_5_std": -0.075274, + "nauc_precision_at_5_diff1": 0.033285, + "nauc_precision_at_10_max": 0.098735, + "nauc_precision_at_10_std": 0.046497, + "nauc_precision_at_10_diff1": -0.119502, + "nauc_precision_at_20_max": 0.053981, + "nauc_precision_at_20_std": 0.150335, + "nauc_precision_at_20_diff1": -0.203357, + "nauc_precision_at_100_max": 0.026472, + "nauc_precision_at_100_std": 0.222767, + "nauc_precision_at_100_diff1": -0.238711, + "nauc_precision_at_1000_max": 0.031739, + "nauc_precision_at_1000_std": 0.208791, + "nauc_precision_at_1000_diff1": -0.219596, + "nauc_mrr_at_1_max": 0.492292, + "nauc_mrr_at_1_std": -0.188481, + "nauc_mrr_at_1_diff1": 0.63895, + "nauc_mrr_at_3_max": 0.460086, + "nauc_mrr_at_3_std": -0.255348, + "nauc_mrr_at_3_diff1": 0.610057, + "nauc_mrr_at_5_max": 0.464483, + "nauc_mrr_at_5_std": -0.257418, + "nauc_mrr_at_5_diff1": 0.614409, + "nauc_mrr_at_10_max": 0.467839, + "nauc_mrr_at_10_std": -0.252021, + "nauc_mrr_at_10_diff1": 0.617885, + "nauc_mrr_at_20_max": 0.467958, + "nauc_mrr_at_20_std": -0.249689, + "nauc_mrr_at_20_diff1": 0.617242, + "nauc_mrr_at_100_max": 0.467966, + "nauc_mrr_at_100_std": -0.248663, + "nauc_mrr_at_100_diff1": 0.617441, + "nauc_mrr_at_1000_max": 0.467968, + "nauc_mrr_at_1000_std": -0.248664, + "nauc_mrr_at_1000_diff1": 0.61745, + "main_score": 0.76187, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 37.885751485824585, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackGisRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackGisRetrieval.json new file mode 100644 index 000000000..77d68e90c --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackGisRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "5003b3064772da1887988e05400cf3806fe491f2", + "task_name": "CQADupstackGisRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.39209, + "ndcg_at_3": 0.49285, + "ndcg_at_5": 0.53802, + "ndcg_at_10": 0.58292, + "ndcg_at_20": 0.60535, + "ndcg_at_100": 0.62496, + "ndcg_at_1000": 0.6275, + "map_at_1": 0.36186, + "map_at_3": 0.45573, + "map_at_5": 0.48263, + "map_at_10": 0.50272, + "map_at_20": 0.50951, + "map_at_100": 0.51311, + "map_at_1000": 0.51327, + "recall_at_1": 0.36186, + "recall_at_3": 0.5683, + "recall_at_5": 0.67638, + "recall_at_10": 0.81012, + "recall_at_20": 0.89322, + "recall_at_100": 0.98428, + "recall_at_1000": 0.9988, + "precision_at_1": 0.39209, + "precision_at_3": 0.21281, + "precision_at_5": 0.1539, + "precision_at_10": 0.09356, + "precision_at_20": 0.05226, + "precision_at_100": 0.01195, + "precision_at_1000": 0.00125, + "mrr_at_1": 0.39209, + "mrr_at_3": 0.483427, + "mrr_at_5": 0.50823, + "mrr_at_10": 0.525361, + "mrr_at_20": 0.530801, + "mrr_at_100": 0.532966, + "mrr_at_1000": 0.533008, + "nauc_ndcg_at_1_max": 0.264662, + "nauc_ndcg_at_1_std": -0.212828, + "nauc_ndcg_at_1_diff1": 0.478894, + "nauc_ndcg_at_3_max": 0.185822, + "nauc_ndcg_at_3_std": -0.277958, + "nauc_ndcg_at_3_diff1": 0.405278, + "nauc_ndcg_at_5_max": 0.168616, + "nauc_ndcg_at_5_std": -0.287117, + "nauc_ndcg_at_5_diff1": 0.385456, + "nauc_ndcg_at_10_max": 0.185365, + "nauc_ndcg_at_10_std": -0.309575, + "nauc_ndcg_at_10_diff1": 0.405441, + "nauc_ndcg_at_20_max": 0.184698, + "nauc_ndcg_at_20_std": -0.2971, + "nauc_ndcg_at_20_diff1": 0.404647, + "nauc_ndcg_at_100_max": 0.192428, + "nauc_ndcg_at_100_std": -0.281362, + "nauc_ndcg_at_100_diff1": 0.411844, + "nauc_ndcg_at_1000_max": 0.194941, + "nauc_ndcg_at_1000_std": -0.280267, + "nauc_ndcg_at_1000_diff1": 0.413603, + "nauc_map_at_1_max": 0.227285, + "nauc_map_at_1_std": -0.227251, + "nauc_map_at_1_diff1": 0.484454, + "nauc_map_at_3_max": 0.192609, + "nauc_map_at_3_std": -0.267488, + "nauc_map_at_3_diff1": 0.424627, + "nauc_map_at_5_max": 0.185206, + "nauc_map_at_5_std": -0.272879, + "nauc_map_at_5_diff1": 0.412663, + "nauc_map_at_10_max": 0.192548, + "nauc_map_at_10_std": -0.280495, + "nauc_map_at_10_diff1": 0.41906, + "nauc_map_at_20_max": 0.192641, + "nauc_map_at_20_std": -0.27723, + "nauc_map_at_20_diff1": 0.419023, + "nauc_map_at_100_max": 0.194105, + "nauc_map_at_100_std": -0.275153, + "nauc_map_at_100_diff1": 0.420078, + "nauc_map_at_1000_max": 0.194185, + "nauc_map_at_1000_std": -0.275119, + "nauc_map_at_1000_diff1": 0.420182, + "nauc_recall_at_1_max": 0.227285, + "nauc_recall_at_1_std": -0.227251, + "nauc_recall_at_1_diff1": 0.484454, + "nauc_recall_at_3_max": 0.13346, + "nauc_recall_at_3_std": -0.314498, + "nauc_recall_at_3_diff1": 0.348924, + "nauc_recall_at_5_max": 0.077033, + "nauc_recall_at_5_std": -0.346645, + "nauc_recall_at_5_diff1": 0.283989, + "nauc_recall_at_10_max": 0.115124, + "nauc_recall_at_10_std": -0.483462, + "nauc_recall_at_10_diff1": 0.336443, + "nauc_recall_at_20_max": 0.063023, + "nauc_recall_at_20_std": -0.489831, + "nauc_recall_at_20_diff1": 0.290547, + "nauc_recall_at_100_max": -0.082791, + "nauc_recall_at_100_std": -0.362562, + "nauc_recall_at_100_diff1": 0.250651, + "nauc_recall_at_1000_max": 0.325651, + "nauc_recall_at_1000_std": 0.496804, + "nauc_recall_at_1000_diff1": 0.283168, + "nauc_precision_at_1_max": 0.264662, + "nauc_precision_at_1_std": -0.212828, + "nauc_precision_at_1_diff1": 0.478894, + "nauc_precision_at_3_max": 0.164186, + "nauc_precision_at_3_std": -0.257761, + "nauc_precision_at_3_diff1": 0.262304, + "nauc_precision_at_5_max": 0.10855, + "nauc_precision_at_5_std": -0.268297, + "nauc_precision_at_5_diff1": 0.152323, + "nauc_precision_at_10_max": 0.111564, + "nauc_precision_at_10_std": -0.259956, + "nauc_precision_at_10_diff1": 0.068228, + "nauc_precision_at_20_max": 0.061201, + "nauc_precision_at_20_std": -0.144698, + "nauc_precision_at_20_diff1": -0.056123, + "nauc_precision_at_100_max": 0.025252, + "nauc_precision_at_100_std": 0.039518, + "nauc_precision_at_100_diff1": -0.153637, + "nauc_precision_at_1000_max": 0.021317, + "nauc_precision_at_1000_std": 0.03914, + "nauc_precision_at_1000_diff1": -0.123356, + "nauc_mrr_at_1_max": 0.264662, + "nauc_mrr_at_1_std": -0.212828, + "nauc_mrr_at_1_diff1": 0.478894, + "nauc_mrr_at_3_max": 0.220939, + "nauc_mrr_at_3_std": -0.247549, + "nauc_mrr_at_3_diff1": 0.422949, + "nauc_mrr_at_5_max": 0.21113, + "nauc_mrr_at_5_std": -0.25323, + "nauc_mrr_at_5_diff1": 0.41127, + "nauc_mrr_at_10_max": 0.216621, + "nauc_mrr_at_10_std": -0.261291, + "nauc_mrr_at_10_diff1": 0.420818, + "nauc_mrr_at_20_max": 0.216699, + "nauc_mrr_at_20_std": -0.257568, + "nauc_mrr_at_20_diff1": 0.421523, + "nauc_mrr_at_100_max": 0.217831, + "nauc_mrr_at_100_std": -0.255915, + "nauc_mrr_at_100_diff1": 0.422666, + "nauc_mrr_at_1000_max": 0.217909, + "nauc_mrr_at_1000_std": -0.255828, + "nauc_mrr_at_1000_diff1": 0.422663, + "main_score": 0.58292, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 54.69494819641113, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackMathematicaRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackMathematicaRetrieval.json new file mode 100644 index 000000000..b98e5d603 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackMathematicaRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "90fceea13679c63fe563ded68f3b6f06e50061de", + "task_name": "CQADupstackMathematicaRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.43905, + "ndcg_at_3": 0.54143, + "ndcg_at_5": 0.58288, + "ndcg_at_10": 0.62503, + "ndcg_at_20": 0.64757, + "ndcg_at_100": 0.6668, + "ndcg_at_1000": 0.67027, + "map_at_1": 0.37288, + "map_at_3": 0.48755, + "map_at_5": 0.51582, + "map_at_10": 0.53792, + "map_at_20": 0.5464, + "map_at_100": 0.55109, + "map_at_1000": 0.55142, + "recall_at_1": 0.37288, + "recall_at_3": 0.61148, + "recall_at_5": 0.71176, + "recall_at_10": 0.83006, + "recall_at_20": 0.90272, + "recall_at_100": 0.98081, + "recall_at_1000": 0.99636, + "precision_at_1": 0.43905, + "precision_at_3": 0.25332, + "precision_at_5": 0.18308, + "precision_at_10": 0.11318, + "precision_at_20": 0.06474, + "precision_at_100": 0.01505, + "precision_at_1000": 0.00161, + "mrr_at_1": 0.439055, + "mrr_at_3": 0.551617, + "mrr_at_5": 0.573943, + "mrr_at_10": 0.589125, + "mrr_at_20": 0.593272, + "mrr_at_100": 0.594543, + "mrr_at_1000": 0.594551, + "nauc_ndcg_at_1_max": 0.162096, + "nauc_ndcg_at_1_std": -0.151132, + "nauc_ndcg_at_1_diff1": 0.411167, + "nauc_ndcg_at_3_max": 0.088618, + "nauc_ndcg_at_3_std": -0.241967, + "nauc_ndcg_at_3_diff1": 0.342413, + "nauc_ndcg_at_5_max": 0.074551, + "nauc_ndcg_at_5_std": -0.258041, + "nauc_ndcg_at_5_diff1": 0.33826, + "nauc_ndcg_at_10_max": 0.05871, + "nauc_ndcg_at_10_std": -0.269967, + "nauc_ndcg_at_10_diff1": 0.332542, + "nauc_ndcg_at_20_max": 0.06537, + "nauc_ndcg_at_20_std": -0.266696, + "nauc_ndcg_at_20_diff1": 0.347042, + "nauc_ndcg_at_100_max": 0.088846, + "nauc_ndcg_at_100_std": -0.238945, + "nauc_ndcg_at_100_diff1": 0.351674, + "nauc_ndcg_at_1000_max": 0.089999, + "nauc_ndcg_at_1000_std": -0.240089, + "nauc_ndcg_at_1000_diff1": 0.352177, + "nauc_map_at_1_max": 0.103304, + "nauc_map_at_1_std": -0.165382, + "nauc_map_at_1_diff1": 0.348959, + "nauc_map_at_3_max": 0.087476, + "nauc_map_at_3_std": -0.224698, + "nauc_map_at_3_diff1": 0.335501, + "nauc_map_at_5_max": 0.082928, + "nauc_map_at_5_std": -0.230664, + "nauc_map_at_5_diff1": 0.334956, + "nauc_map_at_10_max": 0.081468, + "nauc_map_at_10_std": -0.233425, + "nauc_map_at_10_diff1": 0.335003, + "nauc_map_at_20_max": 0.082959, + "nauc_map_at_20_std": -0.233544, + "nauc_map_at_20_diff1": 0.339431, + "nauc_map_at_100_max": 0.086381, + "nauc_map_at_100_std": -0.229452, + "nauc_map_at_100_diff1": 0.34064, + "nauc_map_at_1000_max": 0.086483, + "nauc_map_at_1000_std": -0.229556, + "nauc_map_at_1000_diff1": 0.340789, + "nauc_recall_at_1_max": 0.103304, + "nauc_recall_at_1_std": -0.165382, + "nauc_recall_at_1_diff1": 0.348959, + "nauc_recall_at_3_max": 0.026598, + "nauc_recall_at_3_std": -0.292763, + "nauc_recall_at_3_diff1": 0.282337, + "nauc_recall_at_5_max": -0.013414, + "nauc_recall_at_5_std": -0.33322, + "nauc_recall_at_5_diff1": 0.262505, + "nauc_recall_at_10_max": -0.127032, + "nauc_recall_at_10_std": -0.434149, + "nauc_recall_at_10_diff1": 0.21549, + "nauc_recall_at_20_max": -0.198541, + "nauc_recall_at_20_std": -0.520057, + "nauc_recall_at_20_diff1": 0.254342, + "nauc_recall_at_100_max": 0.072213, + "nauc_recall_at_100_std": -0.056245, + "nauc_recall_at_100_diff1": 0.276503, + "nauc_recall_at_1000_max": 0.587166, + "nauc_recall_at_1000_std": 0.49271, + "nauc_recall_at_1000_diff1": 0.533653, + "nauc_precision_at_1_max": 0.162096, + "nauc_precision_at_1_std": -0.151132, + "nauc_precision_at_1_diff1": 0.411167, + "nauc_precision_at_3_max": 0.08915, + "nauc_precision_at_3_std": -0.220558, + "nauc_precision_at_3_diff1": 0.268994, + "nauc_precision_at_5_max": 0.047405, + "nauc_precision_at_5_std": -0.192706, + "nauc_precision_at_5_diff1": 0.186699, + "nauc_precision_at_10_max": 0.004696, + "nauc_precision_at_10_std": -0.120522, + "nauc_precision_at_10_diff1": 0.052485, + "nauc_precision_at_20_max": 0.011718, + "nauc_precision_at_20_std": -0.051367, + "nauc_precision_at_20_diff1": 0.022058, + "nauc_precision_at_100_max": 0.047245, + "nauc_precision_at_100_std": 0.059206, + "nauc_precision_at_100_diff1": -0.04765, + "nauc_precision_at_1000_max": 0.027932, + "nauc_precision_at_1000_std": 0.03938, + "nauc_precision_at_1000_diff1": -0.079657, + "nauc_mrr_at_1_max": 0.162096, + "nauc_mrr_at_1_std": -0.151132, + "nauc_mrr_at_1_diff1": 0.411167, + "nauc_mrr_at_3_max": 0.130528, + "nauc_mrr_at_3_std": -0.213845, + "nauc_mrr_at_3_diff1": 0.386386, + "nauc_mrr_at_5_max": 0.124944, + "nauc_mrr_at_5_std": -0.224879, + "nauc_mrr_at_5_diff1": 0.388699, + "nauc_mrr_at_10_max": 0.116895, + "nauc_mrr_at_10_std": -0.229469, + "nauc_mrr_at_10_diff1": 0.387268, + "nauc_mrr_at_20_max": 0.120381, + "nauc_mrr_at_20_std": -0.225261, + "nauc_mrr_at_20_diff1": 0.389736, + "nauc_mrr_at_100_max": 0.122712, + "nauc_mrr_at_100_std": -0.222463, + "nauc_mrr_at_100_diff1": 0.38974, + "nauc_mrr_at_1000_max": 0.122731, + "nauc_mrr_at_1000_std": -0.222422, + "nauc_mrr_at_1000_diff1": 0.389735, + "main_score": 0.62503, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 33.86972141265869, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackPhysicsRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackPhysicsRetrieval.json new file mode 100644 index 000000000..1bc3911cd --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackPhysicsRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4", + "task_name": "CQADupstackPhysicsRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.51492, + "ndcg_at_3": 0.58961, + "ndcg_at_5": 0.62958, + "ndcg_at_10": 0.66303, + "ndcg_at_20": 0.68623, + "ndcg_at_100": 0.70572, + "ndcg_at_1000": 0.70983, + "map_at_1": 0.42381, + "map_at_3": 0.53454, + "map_at_5": 0.56482, + "map_at_10": 0.58576, + "map_at_20": 0.59533, + "map_at_100": 0.6003, + "map_at_1000": 0.60087, + "recall_at_1": 0.42381, + "recall_at_3": 0.63329, + "recall_at_5": 0.73347, + "recall_at_10": 0.82745, + "recall_at_20": 0.9034, + "recall_at_100": 0.98183, + "recall_at_1000": 0.99841, + "precision_at_1": 0.51492, + "precision_at_3": 0.27976, + "precision_at_5": 0.20212, + "precision_at_10": 0.12243, + "precision_at_20": 0.07026, + "precision_at_100": 0.01664, + "precision_at_1000": 0.00183, + "mrr_at_1": 0.514918, + "mrr_at_3": 0.612127, + "mrr_at_5": 0.633349, + "mrr_at_10": 0.642802, + "mrr_at_20": 0.646713, + "mrr_at_100": 0.648294, + "mrr_at_1000": 0.648315, + "nauc_ndcg_at_1_max": 0.301437, + "nauc_ndcg_at_1_std": -0.17107, + "nauc_ndcg_at_1_diff1": 0.554301, + "nauc_ndcg_at_3_max": 0.259058, + "nauc_ndcg_at_3_std": -0.212162, + "nauc_ndcg_at_3_diff1": 0.482074, + "nauc_ndcg_at_5_max": 0.237147, + "nauc_ndcg_at_5_std": -0.212962, + "nauc_ndcg_at_5_diff1": 0.472031, + "nauc_ndcg_at_10_max": 0.231249, + "nauc_ndcg_at_10_std": -0.23299, + "nauc_ndcg_at_10_diff1": 0.476691, + "nauc_ndcg_at_20_max": 0.241645, + "nauc_ndcg_at_20_std": -0.220323, + "nauc_ndcg_at_20_diff1": 0.47794, + "nauc_ndcg_at_100_max": 0.252023, + "nauc_ndcg_at_100_std": -0.208204, + "nauc_ndcg_at_100_diff1": 0.489048, + "nauc_ndcg_at_1000_max": 0.252544, + "nauc_ndcg_at_1000_std": -0.203415, + "nauc_ndcg_at_1000_diff1": 0.488324, + "nauc_map_at_1_max": 0.236908, + "nauc_map_at_1_std": -0.208936, + "nauc_map_at_1_diff1": 0.537219, + "nauc_map_at_3_max": 0.237709, + "nauc_map_at_3_std": -0.224259, + "nauc_map_at_3_diff1": 0.490216, + "nauc_map_at_5_max": 0.232215, + "nauc_map_at_5_std": -0.222228, + "nauc_map_at_5_diff1": 0.487398, + "nauc_map_at_10_max": 0.235001, + "nauc_map_at_10_std": -0.223725, + "nauc_map_at_10_diff1": 0.488548, + "nauc_map_at_20_max": 0.240961, + "nauc_map_at_20_std": -0.217762, + "nauc_map_at_20_diff1": 0.48957, + "nauc_map_at_100_max": 0.243131, + "nauc_map_at_100_std": -0.214038, + "nauc_map_at_100_diff1": 0.491423, + "nauc_map_at_1000_max": 0.243024, + "nauc_map_at_1000_std": -0.213115, + "nauc_map_at_1000_diff1": 0.491282, + "nauc_recall_at_1_max": 0.236908, + "nauc_recall_at_1_std": -0.208936, + "nauc_recall_at_1_diff1": 0.537219, + "nauc_recall_at_3_max": 0.194616, + "nauc_recall_at_3_std": -0.25572, + "nauc_recall_at_3_diff1": 0.407536, + "nauc_recall_at_5_max": 0.143564, + "nauc_recall_at_5_std": -0.251902, + "nauc_recall_at_5_diff1": 0.359527, + "nauc_recall_at_10_max": 0.10926, + "nauc_recall_at_10_std": -0.337498, + "nauc_recall_at_10_diff1": 0.341044, + "nauc_recall_at_20_max": 0.112184, + "nauc_recall_at_20_std": -0.332093, + "nauc_recall_at_20_diff1": 0.292463, + "nauc_recall_at_100_max": 0.133767, + "nauc_recall_at_100_std": -0.35006, + "nauc_recall_at_100_diff1": 0.339876, + "nauc_recall_at_1000_max": 0.233852, + "nauc_recall_at_1000_std": -0.157022, + "nauc_recall_at_1000_diff1": 0.003765, + "nauc_precision_at_1_max": 0.301437, + "nauc_precision_at_1_std": -0.17107, + "nauc_precision_at_1_diff1": 0.554301, + "nauc_precision_at_3_max": 0.213114, + "nauc_precision_at_3_std": -0.078273, + "nauc_precision_at_3_diff1": 0.21375, + "nauc_precision_at_5_max": 0.136034, + "nauc_precision_at_5_std": 0.011762, + "nauc_precision_at_5_diff1": 0.074522, + "nauc_precision_at_10_max": 0.065189, + "nauc_precision_at_10_std": 0.068775, + "nauc_precision_at_10_diff1": -0.0442, + "nauc_precision_at_20_max": 0.052707, + "nauc_precision_at_20_std": 0.161728, + "nauc_precision_at_20_diff1": -0.119632, + "nauc_precision_at_100_max": -0.000951, + "nauc_precision_at_100_std": 0.240437, + "nauc_precision_at_100_diff1": -0.176598, + "nauc_precision_at_1000_max": -0.042524, + "nauc_precision_at_1000_std": 0.264369, + "nauc_precision_at_1000_diff1": -0.200956, + "nauc_mrr_at_1_max": 0.301437, + "nauc_mrr_at_1_std": -0.17107, + "nauc_mrr_at_1_diff1": 0.554301, + "nauc_mrr_at_3_max": 0.289164, + "nauc_mrr_at_3_std": -0.194478, + "nauc_mrr_at_3_diff1": 0.516591, + "nauc_mrr_at_5_max": 0.281553, + "nauc_mrr_at_5_std": -0.19149, + "nauc_mrr_at_5_diff1": 0.510411, + "nauc_mrr_at_10_max": 0.281937, + "nauc_mrr_at_10_std": -0.195736, + "nauc_mrr_at_10_diff1": 0.513434, + "nauc_mrr_at_20_max": 0.282364, + "nauc_mrr_at_20_std": -0.194641, + "nauc_mrr_at_20_diff1": 0.514046, + "nauc_mrr_at_100_max": 0.283415, + "nauc_mrr_at_100_std": -0.193782, + "nauc_mrr_at_100_diff1": 0.515202, + "nauc_mrr_at_1000_max": 0.28344, + "nauc_mrr_at_1000_std": -0.193778, + "nauc_mrr_at_1000_diff1": 0.515247, + "main_score": 0.66303, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 60.55106854438782, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackProgrammersRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackProgrammersRetrieval.json new file mode 100644 index 000000000..952d95b77 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackProgrammersRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "6184bc1440d2dbc7612be22b50686b8826d22b32", + "task_name": "CQADupstackProgrammersRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.50571, + "ndcg_at_3": 0.59172, + "ndcg_at_5": 0.6275, + "ndcg_at_10": 0.66248, + "ndcg_at_20": 0.68278, + "ndcg_at_100": 0.70255, + "ndcg_at_1000": 0.70575, + "map_at_1": 0.41818, + "map_at_3": 0.53475, + "map_at_5": 0.56304, + "map_at_10": 0.58266, + "map_at_20": 0.5909, + "map_at_100": 0.59619, + "map_at_1000": 0.5966, + "recall_at_1": 0.41818, + "recall_at_3": 0.64501, + "recall_at_5": 0.73859, + "recall_at_10": 0.84141, + "recall_at_20": 0.90812, + "recall_at_100": 0.98455, + "recall_at_1000": 0.99761, + "precision_at_1": 0.50571, + "precision_at_3": 0.28158, + "precision_at_5": 0.2, + "precision_at_10": 0.11906, + "precision_at_20": 0.06787, + "precision_at_100": 0.01623, + "precision_at_1000": 0.00178, + "mrr_at_1": 0.505708, + "mrr_at_3": 0.604072, + "mrr_at_5": 0.624334, + "mrr_at_10": 0.636299, + "mrr_at_20": 0.639904, + "mrr_at_100": 0.641079, + "mrr_at_1000": 0.641086, + "nauc_ndcg_at_1_max": 0.420262, + "nauc_ndcg_at_1_std": -0.05722, + "nauc_ndcg_at_1_diff1": 0.554395, + "nauc_ndcg_at_3_max": 0.329961, + "nauc_ndcg_at_3_std": -0.164216, + "nauc_ndcg_at_3_diff1": 0.48097, + "nauc_ndcg_at_5_max": 0.324239, + "nauc_ndcg_at_5_std": -0.189012, + "nauc_ndcg_at_5_diff1": 0.493926, + "nauc_ndcg_at_10_max": 0.338528, + "nauc_ndcg_at_10_std": -0.180556, + "nauc_ndcg_at_10_diff1": 0.500045, + "nauc_ndcg_at_20_max": 0.350426, + "nauc_ndcg_at_20_std": -0.160641, + "nauc_ndcg_at_20_diff1": 0.50973, + "nauc_ndcg_at_100_max": 0.364175, + "nauc_ndcg_at_100_std": -0.13395, + "nauc_ndcg_at_100_diff1": 0.513674, + "nauc_ndcg_at_1000_max": 0.362218, + "nauc_ndcg_at_1000_std": -0.136452, + "nauc_ndcg_at_1000_diff1": 0.514022, + "nauc_map_at_1_max": 0.326513, + "nauc_map_at_1_std": -0.115315, + "nauc_map_at_1_diff1": 0.559581, + "nauc_map_at_3_max": 0.316138, + "nauc_map_at_3_std": -0.159346, + "nauc_map_at_3_diff1": 0.49392, + "nauc_map_at_5_max": 0.323386, + "nauc_map_at_5_std": -0.16442, + "nauc_map_at_5_diff1": 0.49994, + "nauc_map_at_10_max": 0.335319, + "nauc_map_at_10_std": -0.156957, + "nauc_map_at_10_diff1": 0.503591, + "nauc_map_at_20_max": 0.341801, + "nauc_map_at_20_std": -0.149991, + "nauc_map_at_20_diff1": 0.507969, + "nauc_map_at_100_max": 0.345083, + "nauc_map_at_100_std": -0.144103, + "nauc_map_at_100_diff1": 0.509176, + "nauc_map_at_1000_max": 0.345052, + "nauc_map_at_1000_std": -0.144262, + "nauc_map_at_1000_diff1": 0.509405, + "nauc_recall_at_1_max": 0.326513, + "nauc_recall_at_1_std": -0.115315, + "nauc_recall_at_1_diff1": 0.559581, + "nauc_recall_at_3_max": 0.224063, + "nauc_recall_at_3_std": -0.257213, + "nauc_recall_at_3_diff1": 0.399728, + "nauc_recall_at_5_max": 0.194972, + "nauc_recall_at_5_std": -0.335699, + "nauc_recall_at_5_diff1": 0.402911, + "nauc_recall_at_10_max": 0.2145, + "nauc_recall_at_10_std": -0.363744, + "nauc_recall_at_10_diff1": 0.384851, + "nauc_recall_at_20_max": 0.235492, + "nauc_recall_at_20_std": -0.333723, + "nauc_recall_at_20_diff1": 0.420027, + "nauc_recall_at_100_max": 0.479547, + "nauc_recall_at_100_std": 0.053942, + "nauc_recall_at_100_diff1": 0.433236, + "nauc_recall_at_1000_max": 0.734577, + "nauc_recall_at_1000_std": 0.39924, + "nauc_recall_at_1000_diff1": 0.554157, + "nauc_precision_at_1_max": 0.420262, + "nauc_precision_at_1_std": -0.05722, + "nauc_precision_at_1_diff1": 0.554395, + "nauc_precision_at_3_max": 0.288058, + "nauc_precision_at_3_std": -0.056189, + "nauc_precision_at_3_diff1": 0.19248, + "nauc_precision_at_5_max": 0.225646, + "nauc_precision_at_5_std": -0.032057, + "nauc_precision_at_5_diff1": 0.093968, + "nauc_precision_at_10_max": 0.179763, + "nauc_precision_at_10_std": 0.0659, + "nauc_precision_at_10_diff1": -0.016125, + "nauc_precision_at_20_max": 0.135546, + "nauc_precision_at_20_std": 0.138169, + "nauc_precision_at_20_diff1": -0.071066, + "nauc_precision_at_100_max": 0.059515, + "nauc_precision_at_100_std": 0.202045, + "nauc_precision_at_100_diff1": -0.140951, + "nauc_precision_at_1000_max": -0.021899, + "nauc_precision_at_1000_std": 0.129706, + "nauc_precision_at_1000_diff1": -0.161431, + "nauc_mrr_at_1_max": 0.420262, + "nauc_mrr_at_1_std": -0.05722, + "nauc_mrr_at_1_diff1": 0.554395, + "nauc_mrr_at_3_max": 0.379837, + "nauc_mrr_at_3_std": -0.117873, + "nauc_mrr_at_3_diff1": 0.511615, + "nauc_mrr_at_5_max": 0.377224, + "nauc_mrr_at_5_std": -0.129371, + "nauc_mrr_at_5_diff1": 0.515522, + "nauc_mrr_at_10_max": 0.384478, + "nauc_mrr_at_10_std": -0.12175, + "nauc_mrr_at_10_diff1": 0.520051, + "nauc_mrr_at_20_max": 0.384741, + "nauc_mrr_at_20_std": -0.117426, + "nauc_mrr_at_20_diff1": 0.520716, + "nauc_mrr_at_100_max": 0.384799, + "nauc_mrr_at_100_std": -0.116716, + "nauc_mrr_at_100_diff1": 0.520839, + "nauc_mrr_at_1000_max": 0.384786, + "nauc_mrr_at_1000_std": -0.116704, + "nauc_mrr_at_1000_diff1": 0.520826, + "main_score": 0.66248, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 47.83789134025574, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackStatsRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackStatsRetrieval.json new file mode 100644 index 000000000..526229647 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackStatsRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "65ac3a16b8e91f9cee4c9828cc7c335575432a2a", + "task_name": "CQADupstackStatsRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.39724, + "ndcg_at_3": 0.46347, + "ndcg_at_5": 0.49681, + "ndcg_at_10": 0.54087, + "ndcg_at_20": 0.57353, + "ndcg_at_100": 0.60243, + "ndcg_at_1000": 0.60638, + "map_at_1": 0.3609, + "map_at_3": 0.43038, + "map_at_5": 0.45138, + "map_at_10": 0.47182, + "map_at_20": 0.48222, + "map_at_100": 0.48763, + "map_at_1000": 0.48795, + "recall_at_1": 0.3609, + "recall_at_3": 0.50627, + "recall_at_5": 0.58991, + "recall_at_10": 0.72076, + "recall_at_20": 0.84233, + "recall_at_100": 0.97385, + "recall_at_1000": 0.99719, + "precision_at_1": 0.39724, + "precision_at_3": 0.19632, + "precision_at_5": 0.13926, + "precision_at_10": 0.08819, + "precision_at_20": 0.05276, + "precision_at_100": 0.01308, + "precision_at_1000": 0.00138, + "mrr_at_1": 0.397239, + "mrr_at_3": 0.467025, + "mrr_at_5": 0.485506, + "mrr_at_10": 0.503342, + "mrr_at_20": 0.511334, + "mrr_at_100": 0.514334, + "mrr_at_1000": 0.514408, + "nauc_ndcg_at_1_max": 0.361382, + "nauc_ndcg_at_1_std": -0.10133, + "nauc_ndcg_at_1_diff1": 0.531411, + "nauc_ndcg_at_3_max": 0.294233, + "nauc_ndcg_at_3_std": -0.161553, + "nauc_ndcg_at_3_diff1": 0.475653, + "nauc_ndcg_at_5_max": 0.304694, + "nauc_ndcg_at_5_std": -0.158787, + "nauc_ndcg_at_5_diff1": 0.481962, + "nauc_ndcg_at_10_max": 0.297447, + "nauc_ndcg_at_10_std": -0.169543, + "nauc_ndcg_at_10_diff1": 0.487082, + "nauc_ndcg_at_20_max": 0.291963, + "nauc_ndcg_at_20_std": -0.170743, + "nauc_ndcg_at_20_diff1": 0.477756, + "nauc_ndcg_at_100_max": 0.306578, + "nauc_ndcg_at_100_std": -0.155416, + "nauc_ndcg_at_100_diff1": 0.488914, + "nauc_ndcg_at_1000_max": 0.3096, + "nauc_ndcg_at_1000_std": -0.152675, + "nauc_ndcg_at_1000_diff1": 0.488258, + "nauc_map_at_1_max": 0.300808, + "nauc_map_at_1_std": -0.15718, + "nauc_map_at_1_diff1": 0.516222, + "nauc_map_at_3_max": 0.291135, + "nauc_map_at_3_std": -0.169729, + "nauc_map_at_3_diff1": 0.490269, + "nauc_map_at_5_max": 0.301738, + "nauc_map_at_5_std": -0.161805, + "nauc_map_at_5_diff1": 0.493243, + "nauc_map_at_10_max": 0.30062, + "nauc_map_at_10_std": -0.162607, + "nauc_map_at_10_diff1": 0.493458, + "nauc_map_at_20_max": 0.300899, + "nauc_map_at_20_std": -0.161591, + "nauc_map_at_20_diff1": 0.49109, + "nauc_map_at_100_max": 0.302618, + "nauc_map_at_100_std": -0.159771, + "nauc_map_at_100_diff1": 0.492581, + "nauc_map_at_1000_max": 0.302676, + "nauc_map_at_1000_std": -0.159596, + "nauc_map_at_1000_diff1": 0.492417, + "nauc_recall_at_1_max": 0.300808, + "nauc_recall_at_1_std": -0.15718, + "nauc_recall_at_1_diff1": 0.516222, + "nauc_recall_at_3_max": 0.246082, + "nauc_recall_at_3_std": -0.201788, + "nauc_recall_at_3_diff1": 0.438699, + "nauc_recall_at_5_max": 0.266395, + "nauc_recall_at_5_std": -0.193579, + "nauc_recall_at_5_diff1": 0.441505, + "nauc_recall_at_10_max": 0.223674, + "nauc_recall_at_10_std": -0.231002, + "nauc_recall_at_10_diff1": 0.426187, + "nauc_recall_at_20_max": 0.115303, + "nauc_recall_at_20_std": -0.289978, + "nauc_recall_at_20_diff1": 0.322139, + "nauc_recall_at_100_max": 0.050294, + "nauc_recall_at_100_std": -0.221596, + "nauc_recall_at_100_diff1": 0.328014, + "nauc_recall_at_1000_max": 0.427232, + "nauc_recall_at_1000_std": 0.459048, + "nauc_recall_at_1000_diff1": -0.368438, + "nauc_precision_at_1_max": 0.361382, + "nauc_precision_at_1_std": -0.10133, + "nauc_precision_at_1_diff1": 0.531411, + "nauc_precision_at_3_max": 0.316357, + "nauc_precision_at_3_std": -0.072308, + "nauc_precision_at_3_diff1": 0.383586, + "nauc_precision_at_5_max": 0.325224, + "nauc_precision_at_5_std": -0.012339, + "nauc_precision_at_5_diff1": 0.325957, + "nauc_precision_at_10_max": 0.227025, + "nauc_precision_at_10_std": 0.018247, + "nauc_precision_at_10_diff1": 0.201956, + "nauc_precision_at_20_max": 0.130439, + "nauc_precision_at_20_std": 0.071657, + "nauc_precision_at_20_diff1": 0.026646, + "nauc_precision_at_100_max": 0.064654, + "nauc_precision_at_100_std": 0.182045, + "nauc_precision_at_100_diff1": -0.118889, + "nauc_precision_at_1000_max": 0.041389, + "nauc_precision_at_1000_std": 0.184693, + "nauc_precision_at_1000_diff1": -0.144631, + "nauc_mrr_at_1_max": 0.361382, + "nauc_mrr_at_1_std": -0.10133, + "nauc_mrr_at_1_diff1": 0.531411, + "nauc_mrr_at_3_max": 0.333317, + "nauc_mrr_at_3_std": -0.124978, + "nauc_mrr_at_3_diff1": 0.497462, + "nauc_mrr_at_5_max": 0.337935, + "nauc_mrr_at_5_std": -0.125534, + "nauc_mrr_at_5_diff1": 0.499419, + "nauc_mrr_at_10_max": 0.33449, + "nauc_mrr_at_10_std": -0.131625, + "nauc_mrr_at_10_diff1": 0.502717, + "nauc_mrr_at_20_max": 0.332144, + "nauc_mrr_at_20_std": -0.132128, + "nauc_mrr_at_20_diff1": 0.50034, + "nauc_mrr_at_100_max": 0.333747, + "nauc_mrr_at_100_std": -0.129843, + "nauc_mrr_at_100_diff1": 0.501402, + "nauc_mrr_at_1000_max": 0.333862, + "nauc_mrr_at_1000_std": -0.129801, + "nauc_mrr_at_1000_diff1": 0.501423, + "main_score": 0.54087, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 76.71548318862915, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackTexRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackTexRetrieval.json new file mode 100644 index 000000000..fd36f87c7 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackTexRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "46989137a86843e03a6195de44b09deda022eec7", + "task_name": "CQADupstackTexRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.44701, + "ndcg_at_3": 0.53486, + "ndcg_at_5": 0.56972, + "ndcg_at_10": 0.61119, + "ndcg_at_20": 0.63418, + "ndcg_at_100": 0.65564, + "ndcg_at_1000": 0.66061, + "map_at_1": 0.37651, + "map_at_3": 0.4852, + "map_at_5": 0.5103, + "map_at_10": 0.53134, + "map_at_20": 0.53952, + "map_at_100": 0.5443, + "map_at_1000": 0.54481, + "recall_at_1": 0.37651, + "recall_at_3": 0.59249, + "recall_at_5": 0.68093, + "recall_at_10": 0.80052, + "recall_at_20": 0.8811, + "recall_at_100": 0.97258, + "recall_at_1000": 0.99528, + "precision_at_1": 0.44701, + "precision_at_3": 0.2496, + "precision_at_5": 0.17674, + "precision_at_10": 0.10857, + "precision_at_20": 0.06204, + "precision_at_100": 0.01492, + "precision_at_1000": 0.00167, + "mrr_at_1": 0.447006, + "mrr_at_3": 0.543531, + "mrr_at_5": 0.562767, + "mrr_at_10": 0.578012, + "mrr_at_20": 0.58291, + "mrr_at_100": 0.58486, + "mrr_at_1000": 0.584896, + "nauc_ndcg_at_1_max": 0.32824, + "nauc_ndcg_at_1_std": -0.151496, + "nauc_ndcg_at_1_diff1": 0.511609, + "nauc_ndcg_at_3_max": 0.265845, + "nauc_ndcg_at_3_std": -0.206535, + "nauc_ndcg_at_3_diff1": 0.451959, + "nauc_ndcg_at_5_max": 0.259482, + "nauc_ndcg_at_5_std": -0.216606, + "nauc_ndcg_at_5_diff1": 0.447246, + "nauc_ndcg_at_10_max": 0.254313, + "nauc_ndcg_at_10_std": -0.223218, + "nauc_ndcg_at_10_diff1": 0.44817, + "nauc_ndcg_at_20_max": 0.261289, + "nauc_ndcg_at_20_std": -0.220355, + "nauc_ndcg_at_20_diff1": 0.45121, + "nauc_ndcg_at_100_max": 0.270613, + "nauc_ndcg_at_100_std": -0.202889, + "nauc_ndcg_at_100_diff1": 0.460271, + "nauc_ndcg_at_1000_max": 0.271676, + "nauc_ndcg_at_1000_std": -0.202044, + "nauc_ndcg_at_1000_diff1": 0.462126, + "nauc_map_at_1_max": 0.269914, + "nauc_map_at_1_std": -0.156609, + "nauc_map_at_1_diff1": 0.502334, + "nauc_map_at_3_max": 0.261146, + "nauc_map_at_3_std": -0.197019, + "nauc_map_at_3_diff1": 0.462147, + "nauc_map_at_5_max": 0.261412, + "nauc_map_at_5_std": -0.202905, + "nauc_map_at_5_diff1": 0.458687, + "nauc_map_at_10_max": 0.262169, + "nauc_map_at_10_std": -0.204186, + "nauc_map_at_10_diff1": 0.459665, + "nauc_map_at_20_max": 0.265104, + "nauc_map_at_20_std": -0.202959, + "nauc_map_at_20_diff1": 0.460859, + "nauc_map_at_100_max": 0.267046, + "nauc_map_at_100_std": -0.199832, + "nauc_map_at_100_diff1": 0.462439, + "nauc_map_at_1000_max": 0.267247, + "nauc_map_at_1000_std": -0.19974, + "nauc_map_at_1000_diff1": 0.462734, + "nauc_recall_at_1_max": 0.269914, + "nauc_recall_at_1_std": -0.156609, + "nauc_recall_at_1_diff1": 0.502334, + "nauc_recall_at_3_max": 0.200059, + "nauc_recall_at_3_std": -0.239211, + "nauc_recall_at_3_diff1": 0.390804, + "nauc_recall_at_5_max": 0.181926, + "nauc_recall_at_5_std": -0.267449, + "nauc_recall_at_5_diff1": 0.367754, + "nauc_recall_at_10_max": 0.130795, + "nauc_recall_at_10_std": -0.313187, + "nauc_recall_at_10_diff1": 0.337816, + "nauc_recall_at_20_max": 0.126863, + "nauc_recall_at_20_std": -0.349119, + "nauc_recall_at_20_diff1": 0.300834, + "nauc_recall_at_100_max": 0.168818, + "nauc_recall_at_100_std": -0.135934, + "nauc_recall_at_100_diff1": 0.249535, + "nauc_recall_at_1000_max": 0.205097, + "nauc_recall_at_1000_std": 0.141433, + "nauc_recall_at_1000_diff1": 0.193485, + "nauc_precision_at_1_max": 0.32824, + "nauc_precision_at_1_std": -0.151496, + "nauc_precision_at_1_diff1": 0.511609, + "nauc_precision_at_3_max": 0.233682, + "nauc_precision_at_3_std": -0.174714, + "nauc_precision_at_3_diff1": 0.273479, + "nauc_precision_at_5_max": 0.190349, + "nauc_precision_at_5_std": -0.154284, + "nauc_precision_at_5_diff1": 0.180747, + "nauc_precision_at_10_max": 0.119964, + "nauc_precision_at_10_std": -0.098852, + "nauc_precision_at_10_diff1": 0.067343, + "nauc_precision_at_20_max": 0.085429, + "nauc_precision_at_20_std": -0.028956, + "nauc_precision_at_20_diff1": -0.011926, + "nauc_precision_at_100_max": 0.030566, + "nauc_precision_at_100_std": 0.064346, + "nauc_precision_at_100_diff1": -0.070841, + "nauc_precision_at_1000_max": 0.007398, + "nauc_precision_at_1000_std": 0.064069, + "nauc_precision_at_1000_diff1": -0.072905, + "nauc_mrr_at_1_max": 0.32824, + "nauc_mrr_at_1_std": -0.151496, + "nauc_mrr_at_1_diff1": 0.511609, + "nauc_mrr_at_3_max": 0.291949, + "nauc_mrr_at_3_std": -0.189044, + "nauc_mrr_at_3_diff1": 0.469379, + "nauc_mrr_at_5_max": 0.291698, + "nauc_mrr_at_5_std": -0.191687, + "nauc_mrr_at_5_diff1": 0.470267, + "nauc_mrr_at_10_max": 0.291766, + "nauc_mrr_at_10_std": -0.192544, + "nauc_mrr_at_10_diff1": 0.471621, + "nauc_mrr_at_20_max": 0.293373, + "nauc_mrr_at_20_std": -0.191699, + "nauc_mrr_at_20_diff1": 0.472396, + "nauc_mrr_at_100_max": 0.294099, + "nauc_mrr_at_100_std": -0.189782, + "nauc_mrr_at_100_diff1": 0.473037, + "nauc_mrr_at_1000_max": 0.294098, + "nauc_mrr_at_1000_std": -0.189765, + "nauc_mrr_at_1000_diff1": 0.473053, + "main_score": 0.61119, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 130.09497570991516, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackUnixRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackUnixRetrieval.json new file mode 100644 index 000000000..85a8aad59 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackUnixRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "6c6430d3a6d36f8d2a829195bc5dc94d7e063e53", + "task_name": "CQADupstackUnixRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.46549, + "ndcg_at_3": 0.55316, + "ndcg_at_5": 0.58539, + "ndcg_at_10": 0.62236, + "ndcg_at_20": 0.64486, + "ndcg_at_100": 0.66832, + "ndcg_at_1000": 0.67303, + "map_at_1": 0.4027, + "map_at_3": 0.5053, + "map_at_5": 0.52815, + "map_at_10": 0.54722, + "map_at_20": 0.55532, + "map_at_100": 0.56038, + "map_at_1000": 0.56088, + "recall_at_1": 0.4027, + "recall_at_3": 0.60968, + "recall_at_5": 0.69323, + "recall_at_10": 0.79883, + "recall_at_20": 0.87508, + "recall_at_100": 0.97523, + "recall_at_1000": 0.99835, + "precision_at_1": 0.46549, + "precision_at_3": 0.25373, + "precision_at_5": 0.17724, + "precision_at_10": 0.10625, + "precision_at_20": 0.06077, + "precision_at_100": 0.01459, + "precision_at_1000": 0.00157, + "mrr_at_1": 0.465485, + "mrr_at_3": 0.560945, + "mrr_at_5": 0.580302, + "mrr_at_10": 0.593375, + "mrr_at_20": 0.597766, + "mrr_at_100": 0.599764, + "mrr_at_1000": 0.599824, + "nauc_ndcg_at_1_max": 0.407193, + "nauc_ndcg_at_1_std": -0.129962, + "nauc_ndcg_at_1_diff1": 0.544721, + "nauc_ndcg_at_3_max": 0.325582, + "nauc_ndcg_at_3_std": -0.212115, + "nauc_ndcg_at_3_diff1": 0.459968, + "nauc_ndcg_at_5_max": 0.318117, + "nauc_ndcg_at_5_std": -0.221623, + "nauc_ndcg_at_5_diff1": 0.454845, + "nauc_ndcg_at_10_max": 0.31758, + "nauc_ndcg_at_10_std": -0.227036, + "nauc_ndcg_at_10_diff1": 0.462159, + "nauc_ndcg_at_20_max": 0.323231, + "nauc_ndcg_at_20_std": -0.220688, + "nauc_ndcg_at_20_diff1": 0.467868, + "nauc_ndcg_at_100_max": 0.333193, + "nauc_ndcg_at_100_std": -0.201221, + "nauc_ndcg_at_100_diff1": 0.475366, + "nauc_ndcg_at_1000_max": 0.33595, + "nauc_ndcg_at_1000_std": -0.197463, + "nauc_ndcg_at_1000_diff1": 0.474573, + "nauc_map_at_1_max": 0.329966, + "nauc_map_at_1_std": -0.152349, + "nauc_map_at_1_diff1": 0.532832, + "nauc_map_at_3_max": 0.32874, + "nauc_map_at_3_std": -0.198955, + "nauc_map_at_3_diff1": 0.480926, + "nauc_map_at_5_max": 0.328586, + "nauc_map_at_5_std": -0.199987, + "nauc_map_at_5_diff1": 0.473715, + "nauc_map_at_10_max": 0.32994, + "nauc_map_at_10_std": -0.199811, + "nauc_map_at_10_diff1": 0.4763, + "nauc_map_at_20_max": 0.33128, + "nauc_map_at_20_std": -0.19825, + "nauc_map_at_20_diff1": 0.477652, + "nauc_map_at_100_max": 0.332977, + "nauc_map_at_100_std": -0.19516, + "nauc_map_at_100_diff1": 0.478798, + "nauc_map_at_1000_max": 0.33308, + "nauc_map_at_1000_std": -0.194807, + "nauc_map_at_1000_diff1": 0.478753, + "nauc_recall_at_1_max": 0.329966, + "nauc_recall_at_1_std": -0.152349, + "nauc_recall_at_1_diff1": 0.532832, + "nauc_recall_at_3_max": 0.252158, + "nauc_recall_at_3_std": -0.279205, + "nauc_recall_at_3_diff1": 0.398941, + "nauc_recall_at_5_max": 0.226424, + "nauc_recall_at_5_std": -0.299471, + "nauc_recall_at_5_diff1": 0.355565, + "nauc_recall_at_10_max": 0.173016, + "nauc_recall_at_10_std": -0.377048, + "nauc_recall_at_10_diff1": 0.349342, + "nauc_recall_at_20_max": 0.153475, + "nauc_recall_at_20_std": -0.40948, + "nauc_recall_at_20_diff1": 0.345414, + "nauc_recall_at_100_max": 0.105252, + "nauc_recall_at_100_std": -0.31024, + "nauc_recall_at_100_diff1": 0.402422, + "nauc_recall_at_1000_max": 0.620666, + "nauc_recall_at_1000_std": 0.553005, + "nauc_recall_at_1000_diff1": 0.414723, + "nauc_precision_at_1_max": 0.407193, + "nauc_precision_at_1_std": -0.129962, + "nauc_precision_at_1_diff1": 0.544721, + "nauc_precision_at_3_max": 0.29009, + "nauc_precision_at_3_std": -0.159591, + "nauc_precision_at_3_diff1": 0.248618, + "nauc_precision_at_5_max": 0.213061, + "nauc_precision_at_5_std": -0.137149, + "nauc_precision_at_5_diff1": 0.138471, + "nauc_precision_at_10_max": 0.115655, + "nauc_precision_at_10_std": -0.067191, + "nauc_precision_at_10_diff1": 0.023775, + "nauc_precision_at_20_max": 0.038022, + "nauc_precision_at_20_std": -0.009051, + "nauc_precision_at_20_diff1": -0.062387, + "nauc_precision_at_100_max": -0.049607, + "nauc_precision_at_100_std": 0.099015, + "nauc_precision_at_100_diff1": -0.160546, + "nauc_precision_at_1000_max": -0.070688, + "nauc_precision_at_1000_std": 0.104483, + "nauc_precision_at_1000_diff1": -0.18079, + "nauc_mrr_at_1_max": 0.407193, + "nauc_mrr_at_1_std": -0.129962, + "nauc_mrr_at_1_diff1": 0.544721, + "nauc_mrr_at_3_max": 0.364489, + "nauc_mrr_at_3_std": -0.178728, + "nauc_mrr_at_3_diff1": 0.487224, + "nauc_mrr_at_5_max": 0.364074, + "nauc_mrr_at_5_std": -0.180061, + "nauc_mrr_at_5_diff1": 0.485654, + "nauc_mrr_at_10_max": 0.36318, + "nauc_mrr_at_10_std": -0.18171, + "nauc_mrr_at_10_diff1": 0.488332, + "nauc_mrr_at_20_max": 0.365121, + "nauc_mrr_at_20_std": -0.179388, + "nauc_mrr_at_20_diff1": 0.490044, + "nauc_mrr_at_100_max": 0.365944, + "nauc_mrr_at_100_std": -0.177867, + "nauc_mrr_at_100_diff1": 0.490569, + "nauc_mrr_at_1000_max": 0.366002, + "nauc_mrr_at_1000_std": -0.177812, + "nauc_mrr_at_1000_diff1": 0.490557, + "main_score": 0.62236, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 68.6236310005188, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackWebmastersRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackWebmastersRetrieval.json new file mode 100644 index 000000000..8323cfc66 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackWebmastersRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "160c094312a0e1facb97e55eeddb698c0abe3571", + "task_name": "CQADupstackWebmastersRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.51383, + "ndcg_at_3": 0.60394, + "ndcg_at_5": 0.64136, + "ndcg_at_10": 0.67357, + "ndcg_at_20": 0.69415, + "ndcg_at_100": 0.71024, + "ndcg_at_1000": 0.71603, + "map_at_1": 0.43062, + "map_at_3": 0.54393, + "map_at_5": 0.57311, + "map_at_10": 0.59256, + "map_at_20": 0.60259, + "map_at_100": 0.60959, + "map_at_1000": 0.61118, + "recall_at_1": 0.43062, + "recall_at_3": 0.65001, + "recall_at_5": 0.74747, + "recall_at_10": 0.83879, + "recall_at_20": 0.91218, + "recall_at_100": 0.9785, + "recall_at_1000": 0.99763, + "precision_at_1": 0.51383, + "precision_at_3": 0.28458, + "precision_at_5": 0.20553, + "precision_at_10": 0.12628, + "precision_at_20": 0.07549, + "precision_at_100": 0.02028, + "precision_at_1000": 0.00263, + "mrr_at_1": 0.513834, + "mrr_at_3": 0.609025, + "mrr_at_5": 0.629183, + "mrr_at_10": 0.640487, + "mrr_at_20": 0.644826, + "mrr_at_100": 0.64598, + "mrr_at_1000": 0.645996, + "nauc_ndcg_at_1_max": 0.331533, + "nauc_ndcg_at_1_std": -0.19399, + "nauc_ndcg_at_1_diff1": 0.528428, + "nauc_ndcg_at_3_max": 0.294875, + "nauc_ndcg_at_3_std": -0.240604, + "nauc_ndcg_at_3_diff1": 0.491861, + "nauc_ndcg_at_5_max": 0.275618, + "nauc_ndcg_at_5_std": -0.280837, + "nauc_ndcg_at_5_diff1": 0.479552, + "nauc_ndcg_at_10_max": 0.26233, + "nauc_ndcg_at_10_std": -0.303086, + "nauc_ndcg_at_10_diff1": 0.478674, + "nauc_ndcg_at_20_max": 0.276383, + "nauc_ndcg_at_20_std": -0.292356, + "nauc_ndcg_at_20_diff1": 0.491835, + "nauc_ndcg_at_100_max": 0.292747, + "nauc_ndcg_at_100_std": -0.268215, + "nauc_ndcg_at_100_diff1": 0.494612, + "nauc_ndcg_at_1000_max": 0.288606, + "nauc_ndcg_at_1000_std": -0.265283, + "nauc_ndcg_at_1000_diff1": 0.492014, + "nauc_map_at_1_max": 0.3064, + "nauc_map_at_1_std": -0.219784, + "nauc_map_at_1_diff1": 0.569571, + "nauc_map_at_3_max": 0.301383, + "nauc_map_at_3_std": -0.25765, + "nauc_map_at_3_diff1": 0.515614, + "nauc_map_at_5_max": 0.300625, + "nauc_map_at_5_std": -0.276376, + "nauc_map_at_5_diff1": 0.499819, + "nauc_map_at_10_max": 0.29896, + "nauc_map_at_10_std": -0.283944, + "nauc_map_at_10_diff1": 0.495973, + "nauc_map_at_20_max": 0.303817, + "nauc_map_at_20_std": -0.277709, + "nauc_map_at_20_diff1": 0.501449, + "nauc_map_at_100_max": 0.305607, + "nauc_map_at_100_std": -0.265261, + "nauc_map_at_100_diff1": 0.505225, + "nauc_map_at_1000_max": 0.30428, + "nauc_map_at_1000_std": -0.264638, + "nauc_map_at_1000_diff1": 0.506548, + "nauc_recall_at_1_max": 0.3064, + "nauc_recall_at_1_std": -0.219784, + "nauc_recall_at_1_diff1": 0.569571, + "nauc_recall_at_3_max": 0.224601, + "nauc_recall_at_3_std": -0.298838, + "nauc_recall_at_3_diff1": 0.43738, + "nauc_recall_at_5_max": 0.164785, + "nauc_recall_at_5_std": -0.419582, + "nauc_recall_at_5_diff1": 0.362594, + "nauc_recall_at_10_max": 0.056132, + "nauc_recall_at_10_std": -0.547643, + "nauc_recall_at_10_diff1": 0.321686, + "nauc_recall_at_20_max": 0.032501, + "nauc_recall_at_20_std": -0.617554, + "nauc_recall_at_20_diff1": 0.333094, + "nauc_recall_at_100_max": 0.274523, + "nauc_recall_at_100_std": -0.277233, + "nauc_recall_at_100_diff1": 0.52044, + "nauc_recall_at_1000_max": 0.50261, + "nauc_recall_at_1000_std": 0.022324, + "nauc_recall_at_1000_diff1": 0.467846, + "nauc_precision_at_1_max": 0.331533, + "nauc_precision_at_1_std": -0.19399, + "nauc_precision_at_1_diff1": 0.528428, + "nauc_precision_at_3_max": 0.197896, + "nauc_precision_at_3_std": -0.103175, + "nauc_precision_at_3_diff1": 0.144209, + "nauc_precision_at_5_max": 0.116084, + "nauc_precision_at_5_std": -0.063097, + "nauc_precision_at_5_diff1": -0.003701, + "nauc_precision_at_10_max": -0.009036, + "nauc_precision_at_10_std": 0.015011, + "nauc_precision_at_10_diff1": -0.114509, + "nauc_precision_at_20_max": -0.039853, + "nauc_precision_at_20_std": 0.146993, + "nauc_precision_at_20_diff1": -0.131884, + "nauc_precision_at_100_max": -0.10833, + "nauc_precision_at_100_std": 0.290196, + "nauc_precision_at_100_diff1": -0.098555, + "nauc_precision_at_1000_max": -0.207762, + "nauc_precision_at_1000_std": 0.14973, + "nauc_precision_at_1000_diff1": -0.115938, + "nauc_mrr_at_1_max": 0.331533, + "nauc_mrr_at_1_std": -0.19399, + "nauc_mrr_at_1_diff1": 0.528428, + "nauc_mrr_at_3_max": 0.296529, + "nauc_mrr_at_3_std": -0.2201, + "nauc_mrr_at_3_diff1": 0.490831, + "nauc_mrr_at_5_max": 0.291707, + "nauc_mrr_at_5_std": -0.239026, + "nauc_mrr_at_5_diff1": 0.487315, + "nauc_mrr_at_10_max": 0.288127, + "nauc_mrr_at_10_std": -0.241413, + "nauc_mrr_at_10_diff1": 0.490464, + "nauc_mrr_at_20_max": 0.291937, + "nauc_mrr_at_20_std": -0.235374, + "nauc_mrr_at_20_diff1": 0.491827, + "nauc_mrr_at_100_max": 0.294109, + "nauc_mrr_at_100_std": -0.233056, + "nauc_mrr_at_100_diff1": 0.493141, + "nauc_mrr_at_1000_max": 0.294067, + "nauc_mrr_at_1000_std": -0.233121, + "nauc_mrr_at_1000_diff1": 0.493118, + "main_score": 0.67357, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 22.354535579681396, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackWordpressRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackWordpressRetrieval.json new file mode 100644 index 000000000..b9f301cf2 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/CQADupstackWordpressRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "4ffe81d471b1924886b33c7567bfb200e9eec5c4", + "task_name": "CQADupstackWordpressRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.32163, + "ndcg_at_3": 0.39912, + "ndcg_at_5": 0.43178, + "ndcg_at_10": 0.47129, + "ndcg_at_20": 0.50312, + "ndcg_at_100": 0.54158, + "ndcg_at_1000": 0.5486, + "map_at_1": 0.29119, + "map_at_3": 0.36784, + "map_at_5": 0.38726, + "map_at_10": 0.40536, + "map_at_20": 0.41475, + "map_at_100": 0.42121, + "map_at_1000": 0.42168, + "recall_at_1": 0.29119, + "recall_at_3": 0.45989, + "recall_at_5": 0.53795, + "recall_at_10": 0.65228, + "recall_at_20": 0.7701, + "recall_at_100": 0.95523, + "recall_at_1000": 0.99813, + "precision_at_1": 0.32163, + "precision_at_3": 0.17252, + "precision_at_5": 0.12163, + "precision_at_10": 0.07542, + "precision_at_20": 0.04538, + "precision_at_100": 0.01183, + "precision_at_1000": 0.00134, + "mrr_at_1": 0.321627, + "mrr_at_3": 0.395872, + "mrr_at_5": 0.414264, + "mrr_at_10": 0.429326, + "mrr_at_20": 0.437979, + "mrr_at_100": 0.442904, + "mrr_at_1000": 0.443078, + "nauc_ndcg_at_1_max": 0.456803, + "nauc_ndcg_at_1_std": -0.101888, + "nauc_ndcg_at_1_diff1": 0.576678, + "nauc_ndcg_at_3_max": 0.365358, + "nauc_ndcg_at_3_std": -0.103559, + "nauc_ndcg_at_3_diff1": 0.489735, + "nauc_ndcg_at_5_max": 0.346385, + "nauc_ndcg_at_5_std": -0.133599, + "nauc_ndcg_at_5_diff1": 0.4732, + "nauc_ndcg_at_10_max": 0.336232, + "nauc_ndcg_at_10_std": -0.134143, + "nauc_ndcg_at_10_diff1": 0.466525, + "nauc_ndcg_at_20_max": 0.332748, + "nauc_ndcg_at_20_std": -0.129531, + "nauc_ndcg_at_20_diff1": 0.465179, + "nauc_ndcg_at_100_max": 0.352546, + "nauc_ndcg_at_100_std": -0.125783, + "nauc_ndcg_at_100_diff1": 0.484376, + "nauc_ndcg_at_1000_max": 0.357898, + "nauc_ndcg_at_1000_std": -0.119993, + "nauc_ndcg_at_1000_diff1": 0.488115, + "nauc_map_at_1_max": 0.413783, + "nauc_map_at_1_std": -0.131075, + "nauc_map_at_1_diff1": 0.57934, + "nauc_map_at_3_max": 0.371835, + "nauc_map_at_3_std": -0.110604, + "nauc_map_at_3_diff1": 0.50627, + "nauc_map_at_5_max": 0.365089, + "nauc_map_at_5_std": -0.125709, + "nauc_map_at_5_diff1": 0.499087, + "nauc_map_at_10_max": 0.36134, + "nauc_map_at_10_std": -0.12409, + "nauc_map_at_10_diff1": 0.497485, + "nauc_map_at_20_max": 0.360913, + "nauc_map_at_20_std": -0.121782, + "nauc_map_at_20_diff1": 0.497715, + "nauc_map_at_100_max": 0.364018, + "nauc_map_at_100_std": -0.12054, + "nauc_map_at_100_diff1": 0.500675, + "nauc_map_at_1000_max": 0.364129, + "nauc_map_at_1000_std": -0.120328, + "nauc_map_at_1000_diff1": 0.500788, + "nauc_recall_at_1_max": 0.413783, + "nauc_recall_at_1_std": -0.131075, + "nauc_recall_at_1_diff1": 0.57934, + "nauc_recall_at_3_max": 0.298879, + "nauc_recall_at_3_std": -0.108827, + "nauc_recall_at_3_diff1": 0.419921, + "nauc_recall_at_5_max": 0.246836, + "nauc_recall_at_5_std": -0.174099, + "nauc_recall_at_5_diff1": 0.369029, + "nauc_recall_at_10_max": 0.199989, + "nauc_recall_at_10_std": -0.195206, + "nauc_recall_at_10_diff1": 0.334429, + "nauc_recall_at_20_max": 0.13375, + "nauc_recall_at_20_std": -0.197934, + "nauc_recall_at_20_diff1": 0.279317, + "nauc_recall_at_100_max": 0.01759, + "nauc_recall_at_100_std": -0.391487, + "nauc_recall_at_100_diff1": 0.208902, + "nauc_recall_at_1000_max": 0.538588, + "nauc_recall_at_1000_std": 0.764463, + "nauc_recall_at_1000_diff1": 0.148139, + "nauc_precision_at_1_max": 0.456803, + "nauc_precision_at_1_std": -0.101888, + "nauc_precision_at_1_diff1": 0.576678, + "nauc_precision_at_3_max": 0.328845, + "nauc_precision_at_3_std": -0.053524, + "nauc_precision_at_3_diff1": 0.389841, + "nauc_precision_at_5_max": 0.291318, + "nauc_precision_at_5_std": -0.102324, + "nauc_precision_at_5_diff1": 0.340046, + "nauc_precision_at_10_max": 0.211602, + "nauc_precision_at_10_std": -0.059966, + "nauc_precision_at_10_diff1": 0.254596, + "nauc_precision_at_20_max": 0.116455, + "nauc_precision_at_20_std": -0.007918, + "nauc_precision_at_20_diff1": 0.136255, + "nauc_precision_at_100_max": -0.00964, + "nauc_precision_at_100_std": 0.084865, + "nauc_precision_at_100_diff1": -0.076214, + "nauc_precision_at_1000_max": -0.15356, + "nauc_precision_at_1000_std": -0.014555, + "nauc_precision_at_1000_diff1": -0.188146, + "nauc_mrr_at_1_max": 0.456803, + "nauc_mrr_at_1_std": -0.101888, + "nauc_mrr_at_1_diff1": 0.576678, + "nauc_mrr_at_3_max": 0.410251, + "nauc_mrr_at_3_std": -0.089837, + "nauc_mrr_at_3_diff1": 0.517665, + "nauc_mrr_at_5_max": 0.396397, + "nauc_mrr_at_5_std": -0.10616, + "nauc_mrr_at_5_diff1": 0.506898, + "nauc_mrr_at_10_max": 0.393767, + "nauc_mrr_at_10_std": -0.10593, + "nauc_mrr_at_10_diff1": 0.50405, + "nauc_mrr_at_20_max": 0.393802, + "nauc_mrr_at_20_std": -0.105429, + "nauc_mrr_at_20_diff1": 0.504437, + "nauc_mrr_at_100_max": 0.396748, + "nauc_mrr_at_100_std": -0.105133, + "nauc_mrr_at_100_diff1": 0.507837, + "nauc_mrr_at_1000_max": 0.396898, + "nauc_mrr_at_1000_std": -0.104893, + "nauc_mrr_at_1000_diff1": 0.507977, + "main_score": 0.47129, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 75.03050684928894, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/ClimateFEVER.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/ClimateFEVER.json new file mode 100644 index 000000000..7ac82d812 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/ClimateFEVER.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "47f2ac6acb640fc46020b02a5b59fdda04d39380", + "task_name": "ClimateFEVER", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.50554, + "ndcg_at_3": 0.43898, + "ndcg_at_5": 0.46564, + "ndcg_at_10": 0.5149, + "ndcg_at_20": 0.5486, + "ndcg_at_100": 0.5896, + "ndcg_at_1000": 0.60925, + "map_at_1": 0.21877, + "map_at_3": 0.33727, + "map_at_5": 0.37524, + "map_at_10": 0.40536, + "map_at_20": 0.42032, + "map_at_100": 0.43013, + "map_at_1000": 0.43154, + "recall_at_1": 0.21877, + "recall_at_3": 0.39606, + "recall_at_5": 0.48091, + "recall_at_10": 0.58859, + "recall_at_20": 0.68067, + "recall_at_100": 0.83055, + "recall_at_1000": 0.93482, + "precision_at_1": 0.50554, + "precision_at_3": 0.33659, + "precision_at_5": 0.25329, + "precision_at_10": 0.16007, + "precision_at_20": 0.09505, + "precision_at_100": 0.02418, + "precision_at_1000": 0.00279, + "mrr_at_1": 0.505537, + "mrr_at_3": 0.608469, + "mrr_at_5": 0.621531, + "mrr_at_10": 0.631471, + "mrr_at_20": 0.635007, + "mrr_at_100": 0.636706, + "mrr_at_1000": 0.636813, + "nauc_ndcg_at_1_max": 0.264607, + "nauc_ndcg_at_1_std": 0.106172, + "nauc_ndcg_at_1_diff1": 0.343281, + "nauc_ndcg_at_3_max": 0.294175, + "nauc_ndcg_at_3_std": 0.135463, + "nauc_ndcg_at_3_diff1": 0.277207, + "nauc_ndcg_at_5_max": 0.305643, + "nauc_ndcg_at_5_std": 0.148844, + "nauc_ndcg_at_5_diff1": 0.281792, + "nauc_ndcg_at_10_max": 0.309079, + "nauc_ndcg_at_10_std": 0.16496, + "nauc_ndcg_at_10_diff1": 0.284321, + "nauc_ndcg_at_20_max": 0.319792, + "nauc_ndcg_at_20_std": 0.18369, + "nauc_ndcg_at_20_diff1": 0.295666, + "nauc_ndcg_at_100_max": 0.323319, + "nauc_ndcg_at_100_std": 0.191662, + "nauc_ndcg_at_100_diff1": 0.299658, + "nauc_ndcg_at_1000_max": 0.322351, + "nauc_ndcg_at_1000_std": 0.190251, + "nauc_ndcg_at_1000_diff1": 0.30085, + "nauc_map_at_1_max": 0.307554, + "nauc_map_at_1_std": 0.071273, + "nauc_map_at_1_diff1": 0.361357, + "nauc_map_at_3_max": 0.31241, + "nauc_map_at_3_std": 0.125629, + "nauc_map_at_3_diff1": 0.290145, + "nauc_map_at_5_max": 0.314699, + "nauc_map_at_5_std": 0.138073, + "nauc_map_at_5_diff1": 0.285658, + "nauc_map_at_10_max": 0.317118, + "nauc_map_at_10_std": 0.148662, + "nauc_map_at_10_diff1": 0.287584, + "nauc_map_at_20_max": 0.322759, + "nauc_map_at_20_std": 0.157774, + "nauc_map_at_20_diff1": 0.291277, + "nauc_map_at_100_max": 0.32407, + "nauc_map_at_100_std": 0.161035, + "nauc_map_at_100_diff1": 0.29261, + "nauc_map_at_1000_max": 0.324157, + "nauc_map_at_1000_std": 0.161241, + "nauc_map_at_1000_diff1": 0.292586, + "nauc_recall_at_1_max": 0.307554, + "nauc_recall_at_1_std": 0.071273, + "nauc_recall_at_1_diff1": 0.361357, + "nauc_recall_at_3_max": 0.294726, + "nauc_recall_at_3_std": 0.13527, + "nauc_recall_at_3_diff1": 0.24983, + "nauc_recall_at_5_max": 0.284626, + "nauc_recall_at_5_std": 0.154379, + "nauc_recall_at_5_diff1": 0.225643, + "nauc_recall_at_10_max": 0.281697, + "nauc_recall_at_10_std": 0.180473, + "nauc_recall_at_10_diff1": 0.22315, + "nauc_recall_at_20_max": 0.305892, + "nauc_recall_at_20_std": 0.232925, + "nauc_recall_at_20_diff1": 0.247555, + "nauc_recall_at_100_max": 0.330156, + "nauc_recall_at_100_std": 0.30297, + "nauc_recall_at_100_diff1": 0.257315, + "nauc_recall_at_1000_max": 0.381743, + "nauc_recall_at_1000_std": 0.441079, + "nauc_recall_at_1000_diff1": 0.298396, + "nauc_precision_at_1_max": 0.264607, + "nauc_precision_at_1_std": 0.106172, + "nauc_precision_at_1_diff1": 0.343281, + "nauc_precision_at_3_max": 0.200444, + "nauc_precision_at_3_std": 0.160278, + "nauc_precision_at_3_diff1": 0.144584, + "nauc_precision_at_5_max": 0.167021, + "nauc_precision_at_5_std": 0.165345, + "nauc_precision_at_5_diff1": 0.108599, + "nauc_precision_at_10_max": 0.126103, + "nauc_precision_at_10_std": 0.180016, + "nauc_precision_at_10_diff1": 0.064595, + "nauc_precision_at_20_max": 0.104932, + "nauc_precision_at_20_std": 0.203481, + "nauc_precision_at_20_diff1": 0.048236, + "nauc_precision_at_100_max": -0.009293, + "nauc_precision_at_100_std": 0.165296, + "nauc_precision_at_100_diff1": -0.057615, + "nauc_precision_at_1000_max": -0.124443, + "nauc_precision_at_1000_std": 0.092289, + "nauc_precision_at_1000_diff1": -0.15163, + "nauc_mrr_at_1_max": 0.264607, + "nauc_mrr_at_1_std": 0.106172, + "nauc_mrr_at_1_diff1": 0.343281, + "nauc_mrr_at_3_max": 0.27089, + "nauc_mrr_at_3_std": 0.125907, + "nauc_mrr_at_3_diff1": 0.319809, + "nauc_mrr_at_5_max": 0.270426, + "nauc_mrr_at_5_std": 0.129639, + "nauc_mrr_at_5_diff1": 0.316698, + "nauc_mrr_at_10_max": 0.270662, + "nauc_mrr_at_10_std": 0.131182, + "nauc_mrr_at_10_diff1": 0.319037, + "nauc_mrr_at_20_max": 0.271426, + "nauc_mrr_at_20_std": 0.131821, + "nauc_mrr_at_20_diff1": 0.321603, + "nauc_mrr_at_100_max": 0.271219, + "nauc_mrr_at_100_std": 0.130777, + "nauc_mrr_at_100_diff1": 0.321275, + "nauc_mrr_at_1000_max": 0.271208, + "nauc_mrr_at_1000_std": 0.130692, + "nauc_mrr_at_1000_diff1": 0.321239, + "main_score": 0.5149, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 4138.002898216248, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/DBPedia.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/DBPedia.json new file mode 100644 index 000000000..9321637be --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/DBPedia.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "c0f706b76e590d620bd6618b3ca8efdd34e2d659", + "task_name": "DBPedia", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.5125, + "ndcg_at_3": 0.46117, + "ndcg_at_5": 0.45765, + "ndcg_at_10": 0.45952, + "ndcg_at_20": 0.46581, + "ndcg_at_100": 0.5203, + "ndcg_at_1000": 0.58342, + "map_at_1": 0.09453, + "map_at_3": 0.16844, + "map_at_5": 0.20347, + "map_at_10": 0.24937, + "map_at_20": 0.28821, + "map_at_100": 0.34111, + "map_at_1000": 0.35679, + "recall_at_1": 0.09453, + "recall_at_3": 0.19532, + "recall_at_5": 0.25333, + "recall_at_10": 0.34424, + "recall_at_20": 0.43104, + "recall_at_100": 0.6221, + "recall_at_1000": 0.81244, + "precision_at_1": 0.635, + "precision_at_3": 0.5075, + "precision_at_5": 0.4475, + "precision_at_10": 0.36225, + "precision_at_20": 0.27725, + "precision_at_100": 0.11262, + "precision_at_1000": 0.02199, + "mrr_at_1": 0.635, + "mrr_at_3": 0.73375, + "mrr_at_5": 0.746625, + "mrr_at_10": 0.75247, + "mrr_at_20": 0.754075, + "mrr_at_100": 0.754639, + "mrr_at_1000": 0.754639, + "nauc_ndcg_at_1_max": 0.210131, + "nauc_ndcg_at_1_std": 0.103849, + "nauc_ndcg_at_1_diff1": 0.333165, + "nauc_ndcg_at_3_max": 0.185702, + "nauc_ndcg_at_3_std": 0.150563, + "nauc_ndcg_at_3_diff1": 0.206632, + "nauc_ndcg_at_5_max": 0.163034, + "nauc_ndcg_at_5_std": 0.157567, + "nauc_ndcg_at_5_diff1": 0.199809, + "nauc_ndcg_at_10_max": 0.126654, + "nauc_ndcg_at_10_std": 0.166865, + "nauc_ndcg_at_10_diff1": 0.194365, + "nauc_ndcg_at_20_max": 0.110974, + "nauc_ndcg_at_20_std": 0.160916, + "nauc_ndcg_at_20_diff1": 0.186814, + "nauc_ndcg_at_100_max": 0.154099, + "nauc_ndcg_at_100_std": 0.263879, + "nauc_ndcg_at_100_diff1": 0.157108, + "nauc_ndcg_at_1000_max": 0.219348, + "nauc_ndcg_at_1000_std": 0.337455, + "nauc_ndcg_at_1000_diff1": 0.156546, + "nauc_map_at_1_max": -0.100584, + "nauc_map_at_1_std": -0.1619, + "nauc_map_at_1_diff1": 0.322461, + "nauc_map_at_3_max": -0.137729, + "nauc_map_at_3_std": -0.135015, + "nauc_map_at_3_diff1": 0.183988, + "nauc_map_at_5_max": -0.117228, + "nauc_map_at_5_std": -0.105962, + "nauc_map_at_5_diff1": 0.177706, + "nauc_map_at_10_max": -0.080693, + "nauc_map_at_10_std": -0.048192, + "nauc_map_at_10_diff1": 0.180641, + "nauc_map_at_20_max": -0.015158, + "nauc_map_at_20_std": 0.033816, + "nauc_map_at_20_diff1": 0.163492, + "nauc_map_at_100_max": 0.072763, + "nauc_map_at_100_std": 0.188986, + "nauc_map_at_100_diff1": 0.129989, + "nauc_map_at_1000_max": 0.085902, + "nauc_map_at_1000_std": 0.210202, + "nauc_map_at_1000_diff1": 0.124698, + "nauc_recall_at_1_max": -0.100584, + "nauc_recall_at_1_std": -0.1619, + "nauc_recall_at_1_diff1": 0.322461, + "nauc_recall_at_3_max": -0.165702, + "nauc_recall_at_3_std": -0.152059, + "nauc_recall_at_3_diff1": 0.141483, + "nauc_recall_at_5_max": -0.16198, + "nauc_recall_at_5_std": -0.139922, + "nauc_recall_at_5_diff1": 0.134532, + "nauc_recall_at_10_max": -0.143509, + "nauc_recall_at_10_std": -0.101176, + "nauc_recall_at_10_diff1": 0.139886, + "nauc_recall_at_20_max": -0.076644, + "nauc_recall_at_20_std": -0.022018, + "nauc_recall_at_20_diff1": 0.116341, + "nauc_recall_at_100_max": 0.057929, + "nauc_recall_at_100_std": 0.255353, + "nauc_recall_at_100_diff1": 0.065409, + "nauc_recall_at_1000_max": 0.206072, + "nauc_recall_at_1000_std": 0.448856, + "nauc_recall_at_1000_diff1": 0.045232, + "nauc_precision_at_1_max": 0.267566, + "nauc_precision_at_1_std": 0.153229, + "nauc_precision_at_1_diff1": 0.339709, + "nauc_precision_at_3_max": 0.254927, + "nauc_precision_at_3_std": 0.306668, + "nauc_precision_at_3_diff1": 0.034519, + "nauc_precision_at_5_max": 0.291918, + "nauc_precision_at_5_std": 0.375282, + "nauc_precision_at_5_diff1": 0.00996, + "nauc_precision_at_10_max": 0.327042, + "nauc_precision_at_10_std": 0.451096, + "nauc_precision_at_10_diff1": -0.015845, + "nauc_precision_at_20_max": 0.366269, + "nauc_precision_at_20_std": 0.499877, + "nauc_precision_at_20_diff1": -0.073597, + "nauc_precision_at_100_max": 0.286934, + "nauc_precision_at_100_std": 0.465647, + "nauc_precision_at_100_diff1": -0.122697, + "nauc_precision_at_1000_max": 0.080647, + "nauc_precision_at_1000_std": 0.080925, + "nauc_precision_at_1000_diff1": -0.095957, + "nauc_mrr_at_1_max": 0.267566, + "nauc_mrr_at_1_std": 0.153229, + "nauc_mrr_at_1_diff1": 0.339709, + "nauc_mrr_at_3_max": 0.291013, + "nauc_mrr_at_3_std": 0.197993, + "nauc_mrr_at_3_diff1": 0.341815, + "nauc_mrr_at_5_max": 0.289818, + "nauc_mrr_at_5_std": 0.198785, + "nauc_mrr_at_5_diff1": 0.343001, + "nauc_mrr_at_10_max": 0.290554, + "nauc_mrr_at_10_std": 0.196114, + "nauc_mrr_at_10_diff1": 0.344422, + "nauc_mrr_at_20_max": 0.290136, + "nauc_mrr_at_20_std": 0.195651, + "nauc_mrr_at_20_diff1": 0.343542, + "nauc_mrr_at_100_max": 0.289819, + "nauc_mrr_at_100_std": 0.19436, + "nauc_mrr_at_100_diff1": 0.343563, + "nauc_mrr_at_1000_max": 0.289819, + "nauc_mrr_at_1000_std": 0.19436, + "nauc_mrr_at_1000_diff1": 0.343563, + "main_score": 0.45952, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 2212.5279500484467, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/FEVER.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/FEVER.json new file mode 100644 index 000000000..a36fe06dc --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/FEVER.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "bea83ef9e8fb933d90a2f1d5515737465d613e12", + "task_name": "FEVER", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.64971, + "ndcg_at_3": 0.76339, + "ndcg_at_5": 0.78592, + "ndcg_at_10": 0.79843, + "ndcg_at_20": 0.80347, + "ndcg_at_100": 0.80944, + "ndcg_at_1000": 0.81189, + "map_at_1": 0.60304, + "map_at_3": 0.71823, + "map_at_5": 0.73239, + "map_at_10": 0.73887, + "map_at_20": 0.7407, + "map_at_100": 0.74198, + "map_at_1000": 0.74214, + "recall_at_1": 0.60304, + "recall_at_3": 0.8459, + "recall_at_5": 0.90085, + "recall_at_10": 0.93723, + "recall_at_20": 0.95459, + "recall_at_100": 0.98034, + "recall_at_1000": 0.99469, + "precision_at_1": 0.64971, + "precision_at_3": 0.30758, + "precision_at_5": 0.19808, + "precision_at_10": 0.10405, + "precision_at_20": 0.05353, + "precision_at_100": 0.01127, + "precision_at_1000": 0.00117, + "mrr_at_1": 0.649715, + "mrr_at_3": 0.764201, + "mrr_at_5": 0.776158, + "mrr_at_10": 0.780222, + "mrr_at_20": 0.780992, + "mrr_at_100": 0.781224, + "mrr_at_1000": 0.781231, + "nauc_ndcg_at_1_max": 0.034269, + "nauc_ndcg_at_1_std": -0.194035, + "nauc_ndcg_at_1_diff1": 0.48387, + "nauc_ndcg_at_3_max": 0.049909, + "nauc_ndcg_at_3_std": -0.206574, + "nauc_ndcg_at_3_diff1": 0.375689, + "nauc_ndcg_at_5_max": 0.047035, + "nauc_ndcg_at_5_std": -0.20274, + "nauc_ndcg_at_5_diff1": 0.380833, + "nauc_ndcg_at_10_max": 0.042664, + "nauc_ndcg_at_10_std": -0.193904, + "nauc_ndcg_at_10_diff1": 0.386074, + "nauc_ndcg_at_20_max": 0.042626, + "nauc_ndcg_at_20_std": -0.192143, + "nauc_ndcg_at_20_diff1": 0.39121, + "nauc_ndcg_at_100_max": 0.04204, + "nauc_ndcg_at_100_std": -0.194447, + "nauc_ndcg_at_100_diff1": 0.399626, + "nauc_ndcg_at_1000_max": 0.045182, + "nauc_ndcg_at_1000_std": -0.194255, + "nauc_ndcg_at_1000_diff1": 0.403835, + "nauc_map_at_1_max": 0.031858, + "nauc_map_at_1_std": -0.169635, + "nauc_map_at_1_diff1": 0.427125, + "nauc_map_at_3_max": 0.040809, + "nauc_map_at_3_std": -0.190705, + "nauc_map_at_3_diff1": 0.381241, + "nauc_map_at_5_max": 0.041032, + "nauc_map_at_5_std": -0.189282, + "nauc_map_at_5_diff1": 0.386423, + "nauc_map_at_10_max": 0.039416, + "nauc_map_at_10_std": -0.187215, + "nauc_map_at_10_diff1": 0.389467, + "nauc_map_at_20_max": 0.03974, + "nauc_map_at_20_std": -0.187124, + "nauc_map_at_20_diff1": 0.391099, + "nauc_map_at_100_max": 0.039825, + "nauc_map_at_100_std": -0.187343, + "nauc_map_at_100_diff1": 0.39257, + "nauc_map_at_1000_max": 0.040031, + "nauc_map_at_1000_std": -0.187299, + "nauc_map_at_1000_diff1": 0.39281, + "nauc_recall_at_1_max": 0.031858, + "nauc_recall_at_1_std": -0.169635, + "nauc_recall_at_1_diff1": 0.427125, + "nauc_recall_at_3_max": 0.050239, + "nauc_recall_at_3_std": -0.213586, + "nauc_recall_at_3_diff1": 0.236461, + "nauc_recall_at_5_max": 0.052418, + "nauc_recall_at_5_std": -0.19491, + "nauc_recall_at_5_diff1": 0.191993, + "nauc_recall_at_10_max": 0.037552, + "nauc_recall_at_10_std": -0.115126, + "nauc_recall_at_10_diff1": 0.140759, + "nauc_recall_at_20_max": 0.024684, + "nauc_recall_at_20_std": -0.067357, + "nauc_recall_at_20_diff1": 0.122255, + "nauc_recall_at_100_max": -0.060509, + "nauc_recall_at_100_std": -0.046875, + "nauc_recall_at_100_diff1": 0.118546, + "nauc_recall_at_1000_max": 0.103763, + "nauc_recall_at_1000_std": 0.243673, + "nauc_recall_at_1000_diff1": 0.187434, + "nauc_precision_at_1_max": 0.034269, + "nauc_precision_at_1_std": -0.194035, + "nauc_precision_at_1_diff1": 0.48387, + "nauc_precision_at_3_max": 0.071052, + "nauc_precision_at_3_std": -0.240418, + "nauc_precision_at_3_diff1": 0.241946, + "nauc_precision_at_5_max": 0.066781, + "nauc_precision_at_5_std": -0.178724, + "nauc_precision_at_5_diff1": 0.135294, + "nauc_precision_at_10_max": 0.032337, + "nauc_precision_at_10_std": -0.079599, + "nauc_precision_at_10_diff1": 0.038115, + "nauc_precision_at_20_max": 0.036168, + "nauc_precision_at_20_std": -0.030444, + "nauc_precision_at_20_diff1": -0.003655, + "nauc_precision_at_100_max": 0.043129, + "nauc_precision_at_100_std": 0.011075, + "nauc_precision_at_100_diff1": -0.018538, + "nauc_precision_at_1000_max": 0.071933, + "nauc_precision_at_1000_std": 0.039, + "nauc_precision_at_1000_diff1": -0.020946, + "nauc_mrr_at_1_max": 0.034269, + "nauc_mrr_at_1_std": -0.194035, + "nauc_mrr_at_1_diff1": 0.48387, + "nauc_mrr_at_3_max": 0.051199, + "nauc_mrr_at_3_std": -0.226081, + "nauc_mrr_at_3_diff1": 0.44388, + "nauc_mrr_at_5_max": 0.050266, + "nauc_mrr_at_5_std": -0.223777, + "nauc_mrr_at_5_diff1": 0.44984, + "nauc_mrr_at_10_max": 0.05085, + "nauc_mrr_at_10_std": -0.218628, + "nauc_mrr_at_10_diff1": 0.452458, + "nauc_mrr_at_20_max": 0.050645, + "nauc_mrr_at_20_std": -0.217544, + "nauc_mrr_at_20_diff1": 0.453429, + "nauc_mrr_at_100_max": 0.050241, + "nauc_mrr_at_100_std": -0.217564, + "nauc_mrr_at_100_diff1": 0.453684, + "nauc_mrr_at_1000_max": 0.050223, + "nauc_mrr_at_1000_std": -0.217579, + "nauc_mrr_at_1000_diff1": 0.45369, + "main_score": 0.79843, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 4604.700364589691, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/FiQA2018.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/FiQA2018.json new file mode 100644 index 000000000..010097986 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/FiQA2018.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "27a168819829fe9bcd655c2df245fb19452e8e06", + "task_name": "FiQA2018", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.54167, + "ndcg_at_3": 0.55344, + "ndcg_at_5": 0.5882, + "ndcg_at_10": 0.63086, + "ndcg_at_20": 0.66023, + "ndcg_at_100": 0.6917, + "ndcg_at_1000": 0.69989, + "map_at_1": 0.31193, + "map_at_3": 0.45298, + "map_at_5": 0.49686, + "map_at_10": 0.52873, + "map_at_20": 0.54262, + "map_at_100": 0.55205, + "map_at_1000": 0.55289, + "recall_at_1": 0.31193, + "recall_at_3": 0.53394, + "recall_at_5": 0.64493, + "recall_at_10": 0.76252, + "recall_at_20": 0.84685, + "recall_at_100": 0.95554, + "recall_at_1000": 0.99407, + "precision_at_1": 0.54167, + "precision_at_3": 0.35545, + "precision_at_5": 0.26914, + "precision_at_10": 0.16898, + "precision_at_20": 0.09776, + "precision_at_100": 0.02392, + "precision_at_1000": 0.00259, + "mrr_at_1": 0.541667, + "mrr_at_3": 0.646348, + "mrr_at_5": 0.665021, + "mrr_at_10": 0.675698, + "mrr_at_20": 0.67844, + "mrr_at_100": 0.679211, + "mrr_at_1000": 0.67923, + "nauc_ndcg_at_1_max": 0.122109, + "nauc_ndcg_at_1_std": -0.317356, + "nauc_ndcg_at_1_diff1": 0.419017, + "nauc_ndcg_at_3_max": 0.101633, + "nauc_ndcg_at_3_std": -0.33682, + "nauc_ndcg_at_3_diff1": 0.336417, + "nauc_ndcg_at_5_max": 0.080599, + "nauc_ndcg_at_5_std": -0.325139, + "nauc_ndcg_at_5_diff1": 0.325964, + "nauc_ndcg_at_10_max": 0.072882, + "nauc_ndcg_at_10_std": -0.338687, + "nauc_ndcg_at_10_diff1": 0.332154, + "nauc_ndcg_at_20_max": 0.073949, + "nauc_ndcg_at_20_std": -0.326919, + "nauc_ndcg_at_20_diff1": 0.317519, + "nauc_ndcg_at_100_max": 0.099184, + "nauc_ndcg_at_100_std": -0.320644, + "nauc_ndcg_at_100_diff1": 0.337488, + "nauc_ndcg_at_1000_max": 0.103094, + "nauc_ndcg_at_1000_std": -0.321147, + "nauc_ndcg_at_1000_diff1": 0.341969, + "nauc_map_at_1_max": -0.030107, + "nauc_map_at_1_std": -0.266508, + "nauc_map_at_1_diff1": 0.338975, + "nauc_map_at_3_max": 0.031552, + "nauc_map_at_3_std": -0.319473, + "nauc_map_at_3_diff1": 0.313387, + "nauc_map_at_5_max": 0.047302, + "nauc_map_at_5_std": -0.3114, + "nauc_map_at_5_diff1": 0.309251, + "nauc_map_at_10_max": 0.05638, + "nauc_map_at_10_std": -0.323738, + "nauc_map_at_10_diff1": 0.314471, + "nauc_map_at_20_max": 0.059587, + "nauc_map_at_20_std": -0.318795, + "nauc_map_at_20_diff1": 0.309614, + "nauc_map_at_100_max": 0.066604, + "nauc_map_at_100_std": -0.318765, + "nauc_map_at_100_diff1": 0.314401, + "nauc_map_at_1000_max": 0.067083, + "nauc_map_at_1000_std": -0.318681, + "nauc_map_at_1000_diff1": 0.31474, + "nauc_recall_at_1_max": -0.030107, + "nauc_recall_at_1_std": -0.266508, + "nauc_recall_at_1_diff1": 0.338975, + "nauc_recall_at_3_max": 0.014384, + "nauc_recall_at_3_std": -0.323045, + "nauc_recall_at_3_diff1": 0.269999, + "nauc_recall_at_5_max": 0.010358, + "nauc_recall_at_5_std": -0.28041, + "nauc_recall_at_5_diff1": 0.232752, + "nauc_recall_at_10_max": -0.030262, + "nauc_recall_at_10_std": -0.326461, + "nauc_recall_at_10_diff1": 0.223933, + "nauc_recall_at_20_max": -0.071337, + "nauc_recall_at_20_std": -0.271433, + "nauc_recall_at_20_diff1": 0.115759, + "nauc_recall_at_100_max": -0.022998, + "nauc_recall_at_100_std": -0.165209, + "nauc_recall_at_100_diff1": 0.112631, + "nauc_recall_at_1000_max": -0.292067, + "nauc_recall_at_1000_std": -0.073503, + "nauc_recall_at_1000_diff1": -0.009715, + "nauc_precision_at_1_max": 0.122109, + "nauc_precision_at_1_std": -0.317356, + "nauc_precision_at_1_diff1": 0.419017, + "nauc_precision_at_3_max": 0.230145, + "nauc_precision_at_3_std": -0.223989, + "nauc_precision_at_3_diff1": 0.16934, + "nauc_precision_at_5_max": 0.236951, + "nauc_precision_at_5_std": -0.134354, + "nauc_precision_at_5_diff1": 0.10193, + "nauc_precision_at_10_max": 0.254857, + "nauc_precision_at_10_std": -0.063523, + "nauc_precision_at_10_diff1": 0.0404, + "nauc_precision_at_20_max": 0.226013, + "nauc_precision_at_20_std": 0.01759, + "nauc_precision_at_20_diff1": -0.043433, + "nauc_precision_at_100_max": 0.224575, + "nauc_precision_at_100_std": 0.100913, + "nauc_precision_at_100_diff1": -0.062307, + "nauc_precision_at_1000_max": 0.200853, + "nauc_precision_at_1000_std": 0.111835, + "nauc_precision_at_1000_diff1": -0.068931, + "nauc_mrr_at_1_max": 0.122109, + "nauc_mrr_at_1_std": -0.317356, + "nauc_mrr_at_1_diff1": 0.419017, + "nauc_mrr_at_3_max": 0.15, + "nauc_mrr_at_3_std": -0.343552, + "nauc_mrr_at_3_diff1": 0.411483, + "nauc_mrr_at_5_max": 0.142617, + "nauc_mrr_at_5_std": -0.341001, + "nauc_mrr_at_5_diff1": 0.409497, + "nauc_mrr_at_10_max": 0.14561, + "nauc_mrr_at_10_std": -0.338259, + "nauc_mrr_at_10_diff1": 0.412069, + "nauc_mrr_at_20_max": 0.143819, + "nauc_mrr_at_20_std": -0.337132, + "nauc_mrr_at_20_diff1": 0.410192, + "nauc_mrr_at_100_max": 0.144192, + "nauc_mrr_at_100_std": -0.337012, + "nauc_mrr_at_100_diff1": 0.411116, + "nauc_mrr_at_1000_max": 0.144156, + "nauc_mrr_at_1000_std": -0.337052, + "nauc_mrr_at_1000_diff1": 0.411088, + "main_score": 0.63086, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 72.56935358047485, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/HotpotQA.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/HotpotQA.json new file mode 100644 index 000000000..e2759111d --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/HotpotQA.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "ab518f4d6fcca38d87c25209f94beba119d02014", + "task_name": "HotpotQA", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.69196, + "ndcg_at_3": 0.60998, + "ndcg_at_5": 0.65429, + "ndcg_at_10": 0.68912, + "ndcg_at_20": 0.71055, + "ndcg_at_100": 0.73374, + "ndcg_at_1000": 0.74093, + "map_at_1": 0.34598, + "map_at_3": 0.53859, + "map_at_5": 0.57289, + "map_at_10": 0.594, + "map_at_20": 0.60289, + "map_at_100": 0.60786, + "map_at_1000": 0.6083, + "recall_at_1": 0.34598, + "recall_at_3": 0.60311, + "recall_at_5": 0.69061, + "recall_at_10": 0.77772, + "recall_at_20": 0.84652, + "recall_at_100": 0.94774, + "recall_at_1000": 0.99338, + "precision_at_1": 0.69196, + "precision_at_3": 0.40207, + "precision_at_5": 0.27625, + "precision_at_10": 0.15554, + "precision_at_20": 0.08465, + "precision_at_100": 0.01895, + "precision_at_1000": 0.00199, + "mrr_at_1": 0.691965, + "mrr_at_3": 0.766036, + "mrr_at_5": 0.77786, + "mrr_at_10": 0.78307, + "mrr_at_20": 0.784652, + "mrr_at_100": 0.785348, + "mrr_at_1000": 0.785385, + "nauc_ndcg_at_1_max": 0.241659, + "nauc_ndcg_at_1_std": -0.264533, + "nauc_ndcg_at_1_diff1": 0.590718, + "nauc_ndcg_at_3_max": 0.112863, + "nauc_ndcg_at_3_std": -0.22173, + "nauc_ndcg_at_3_diff1": 0.309108, + "nauc_ndcg_at_5_max": 0.10377, + "nauc_ndcg_at_5_std": -0.215166, + "nauc_ndcg_at_5_diff1": 0.302285, + "nauc_ndcg_at_10_max": 0.102068, + "nauc_ndcg_at_10_std": -0.214173, + "nauc_ndcg_at_10_diff1": 0.312935, + "nauc_ndcg_at_20_max": 0.104051, + "nauc_ndcg_at_20_std": -0.209474, + "nauc_ndcg_at_20_diff1": 0.320327, + "nauc_ndcg_at_100_max": 0.113058, + "nauc_ndcg_at_100_std": -0.20382, + "nauc_ndcg_at_100_diff1": 0.335762, + "nauc_ndcg_at_1000_max": 0.118616, + "nauc_ndcg_at_1000_std": -0.211607, + "nauc_ndcg_at_1000_diff1": 0.342195, + "nauc_map_at_1_max": 0.241659, + "nauc_map_at_1_std": -0.264533, + "nauc_map_at_1_diff1": 0.590718, + "nauc_map_at_3_max": 0.096989, + "nauc_map_at_3_std": -0.203508, + "nauc_map_at_3_diff1": 0.267485, + "nauc_map_at_5_max": 0.092303, + "nauc_map_at_5_std": -0.201524, + "nauc_map_at_5_diff1": 0.266436, + "nauc_map_at_10_max": 0.092174, + "nauc_map_at_10_std": -0.20211, + "nauc_map_at_10_diff1": 0.273869, + "nauc_map_at_20_max": 0.093061, + "nauc_map_at_20_std": -0.200359, + "nauc_map_at_20_diff1": 0.276655, + "nauc_map_at_100_max": 0.094177, + "nauc_map_at_100_std": -0.199461, + "nauc_map_at_100_diff1": 0.278949, + "nauc_map_at_1000_max": 0.094417, + "nauc_map_at_1000_std": -0.199718, + "nauc_map_at_1000_diff1": 0.279145, + "nauc_recall_at_1_max": 0.241659, + "nauc_recall_at_1_std": -0.264533, + "nauc_recall_at_1_diff1": 0.590718, + "nauc_recall_at_3_max": 0.060389, + "nauc_recall_at_3_std": -0.200619, + "nauc_recall_at_3_diff1": 0.200745, + "nauc_recall_at_5_max": 0.031515, + "nauc_recall_at_5_std": -0.176226, + "nauc_recall_at_5_diff1": 0.162594, + "nauc_recall_at_10_max": 0.008219, + "nauc_recall_at_10_std": -0.158022, + "nauc_recall_at_10_diff1": 0.15408, + "nauc_recall_at_20_max": -0.012222, + "nauc_recall_at_20_std": -0.11861, + "nauc_recall_at_20_diff1": 0.136513, + "nauc_recall_at_100_max": -0.038647, + "nauc_recall_at_100_std": 0.072623, + "nauc_recall_at_100_diff1": 0.124383, + "nauc_recall_at_1000_max": -0.039118, + "nauc_recall_at_1000_std": 0.386005, + "nauc_recall_at_1000_diff1": 0.142687, + "nauc_precision_at_1_max": 0.241659, + "nauc_precision_at_1_std": -0.264533, + "nauc_precision_at_1_diff1": 0.590718, + "nauc_precision_at_3_max": 0.060389, + "nauc_precision_at_3_std": -0.200619, + "nauc_precision_at_3_diff1": 0.200745, + "nauc_precision_at_5_max": 0.031515, + "nauc_precision_at_5_std": -0.176226, + "nauc_precision_at_5_diff1": 0.162594, + "nauc_precision_at_10_max": 0.008219, + "nauc_precision_at_10_std": -0.158022, + "nauc_precision_at_10_diff1": 0.15408, + "nauc_precision_at_20_max": -0.012222, + "nauc_precision_at_20_std": -0.11861, + "nauc_precision_at_20_diff1": 0.136513, + "nauc_precision_at_100_max": -0.038647, + "nauc_precision_at_100_std": 0.072623, + "nauc_precision_at_100_diff1": 0.124383, + "nauc_precision_at_1000_max": -0.039118, + "nauc_precision_at_1000_std": 0.386005, + "nauc_precision_at_1000_diff1": 0.142687, + "nauc_mrr_at_1_max": 0.241659, + "nauc_mrr_at_1_std": -0.264533, + "nauc_mrr_at_1_diff1": 0.590718, + "nauc_mrr_at_3_max": 0.233018, + "nauc_mrr_at_3_std": -0.290832, + "nauc_mrr_at_3_diff1": 0.577306, + "nauc_mrr_at_5_max": 0.231946, + "nauc_mrr_at_5_std": -0.284815, + "nauc_mrr_at_5_diff1": 0.577632, + "nauc_mrr_at_10_max": 0.231863, + "nauc_mrr_at_10_std": -0.283692, + "nauc_mrr_at_10_diff1": 0.578899, + "nauc_mrr_at_20_max": 0.231674, + "nauc_mrr_at_20_std": -0.283935, + "nauc_mrr_at_20_diff1": 0.579121, + "nauc_mrr_at_100_max": 0.23202, + "nauc_mrr_at_100_std": -0.283269, + "nauc_mrr_at_100_diff1": 0.57921, + "nauc_mrr_at_1000_max": 0.232029, + "nauc_mrr_at_1000_std": -0.283322, + "nauc_mrr_at_1000_diff1": 0.579202, + "main_score": 0.68912, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 2875.7968850135803, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/MSMARCO.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/MSMARCO.json new file mode 100644 index 000000000..22c600596 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/MSMARCO.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "c5a29a104738b98a9e76336939199e264163d4a0", + "task_name": "MSMARCO", + "mteb_version": "1.29.16", + "scores": { + "dev": [ + { + "ndcg_at_1": 0.17092, + "ndcg_at_3": 0.27091, + "ndcg_at_5": 0.31214, + "ndcg_at_10": 0.35313, + "ndcg_at_20": 0.38241, + "ndcg_at_100": 0.42179, + "ndcg_at_1000": 0.43594, + "map_at_1": 0.16605, + "map_at_3": 0.24386, + "map_at_5": 0.26677, + "map_at_10": 0.28395, + "map_at_20": 0.29225, + "map_at_100": 0.29792, + "map_at_1000": 0.29852, + "recall_at_1": 0.16605, + "recall_at_3": 0.3434, + "recall_at_5": 0.44292, + "recall_at_10": 0.56809, + "recall_at_20": 0.68132, + "recall_at_100": 0.88872, + "recall_at_1000": 0.99457, + "precision_at_1": 0.17092, + "precision_at_3": 0.11848, + "precision_at_5": 0.09186, + "precision_at_10": 0.05905, + "precision_at_20": 0.03559, + "precision_at_100": 0.00937, + "precision_at_1000": 0.00106, + "mrr_at_1": 0.17063, + "mrr_at_3": 0.249594, + "mrr_at_5": 0.27256, + "mrr_at_10": 0.289353, + "mrr_at_20": 0.297355, + "mrr_at_100": 0.302695, + "mrr_at_1000": 0.303215, + "nauc_ndcg_at_1_max": 0.055625, + "nauc_ndcg_at_1_std": -0.161092, + "nauc_ndcg_at_1_diff1": 0.330972, + "nauc_ndcg_at_3_max": 0.047403, + "nauc_ndcg_at_3_std": -0.198369, + "nauc_ndcg_at_3_diff1": 0.298802, + "nauc_ndcg_at_5_max": 0.042091, + "nauc_ndcg_at_5_std": -0.215124, + "nauc_ndcg_at_5_diff1": 0.296259, + "nauc_ndcg_at_10_max": 0.03827, + "nauc_ndcg_at_10_std": -0.226255, + "nauc_ndcg_at_10_diff1": 0.30363, + "nauc_ndcg_at_20_max": 0.044104, + "nauc_ndcg_at_20_std": -0.214959, + "nauc_ndcg_at_20_diff1": 0.305112, + "nauc_ndcg_at_100_max": 0.044742, + "nauc_ndcg_at_100_std": -0.1941, + "nauc_ndcg_at_100_diff1": 0.307561, + "nauc_ndcg_at_1000_max": 0.044949, + "nauc_ndcg_at_1000_std": -0.199946, + "nauc_ndcg_at_1000_diff1": 0.305748, + "nauc_map_at_1_max": 0.054489, + "nauc_map_at_1_std": -0.164293, + "nauc_map_at_1_diff1": 0.335354, + "nauc_map_at_3_max": 0.048325, + "nauc_map_at_3_std": -0.192464, + "nauc_map_at_3_diff1": 0.306301, + "nauc_map_at_5_max": 0.045377, + "nauc_map_at_5_std": -0.202064, + "nauc_map_at_5_diff1": 0.30474, + "nauc_map_at_10_max": 0.043458, + "nauc_map_at_10_std": -0.206956, + "nauc_map_at_10_diff1": 0.307709, + "nauc_map_at_20_max": 0.044922, + "nauc_map_at_20_std": -0.203867, + "nauc_map_at_20_diff1": 0.307909, + "nauc_map_at_100_max": 0.045049, + "nauc_map_at_100_std": -0.201129, + "nauc_map_at_100_diff1": 0.308317, + "nauc_map_at_1000_max": 0.045051, + "nauc_map_at_1000_std": -0.201204, + "nauc_map_at_1000_diff1": 0.308252, + "nauc_recall_at_1_max": 0.054489, + "nauc_recall_at_1_std": -0.164293, + "nauc_recall_at_1_diff1": 0.335354, + "nauc_recall_at_3_max": 0.044441, + "nauc_recall_at_3_std": -0.214455, + "nauc_recall_at_3_diff1": 0.280922, + "nauc_recall_at_5_max": 0.032275, + "nauc_recall_at_5_std": -0.2497, + "nauc_recall_at_5_diff1": 0.275113, + "nauc_recall_at_10_max": 0.021541, + "nauc_recall_at_10_std": -0.284326, + "nauc_recall_at_10_diff1": 0.294637, + "nauc_recall_at_20_max": 0.04297, + "nauc_recall_at_20_std": -0.248016, + "nauc_recall_at_20_diff1": 0.301545, + "nauc_recall_at_100_max": 0.046029, + "nauc_recall_at_100_std": -0.03588, + "nauc_recall_at_100_diff1": 0.332717, + "nauc_recall_at_1000_max": 0.181391, + "nauc_recall_at_1000_std": 0.572858, + "nauc_recall_at_1000_diff1": 0.317908, + "nauc_precision_at_1_max": 0.055625, + "nauc_precision_at_1_std": -0.161092, + "nauc_precision_at_1_diff1": 0.330972, + "nauc_precision_at_3_max": 0.045372, + "nauc_precision_at_3_std": -0.211767, + "nauc_precision_at_3_diff1": 0.276677, + "nauc_precision_at_5_max": 0.032967, + "nauc_precision_at_5_std": -0.246539, + "nauc_precision_at_5_diff1": 0.269662, + "nauc_precision_at_10_max": 0.02156, + "nauc_precision_at_10_std": -0.274984, + "nauc_precision_at_10_diff1": 0.280481, + "nauc_precision_at_20_max": 0.040815, + "nauc_precision_at_20_std": -0.225257, + "nauc_precision_at_20_diff1": 0.269001, + "nauc_precision_at_100_max": 0.055682, + "nauc_precision_at_100_std": 0.013893, + "nauc_precision_at_100_diff1": 0.17996, + "nauc_precision_at_1000_max": 0.048195, + "nauc_precision_at_1000_std": 0.093265, + "nauc_precision_at_1000_diff1": -0.06713, + "nauc_mrr_at_1_max": 0.056088, + "nauc_mrr_at_1_std": -0.161541, + "nauc_mrr_at_1_diff1": 0.332522, + "nauc_mrr_at_3_max": 0.049326, + "nauc_mrr_at_3_std": -0.187856, + "nauc_mrr_at_3_diff1": 0.303096, + "nauc_mrr_at_5_max": 0.046605, + "nauc_mrr_at_5_std": -0.197372, + "nauc_mrr_at_5_diff1": 0.3015, + "nauc_mrr_at_10_max": 0.044956, + "nauc_mrr_at_10_std": -0.201454, + "nauc_mrr_at_10_diff1": 0.304942, + "nauc_mrr_at_20_max": 0.046911, + "nauc_mrr_at_20_std": -0.198126, + "nauc_mrr_at_20_diff1": 0.305219, + "nauc_mrr_at_100_max": 0.046719, + "nauc_mrr_at_100_std": -0.195834, + "nauc_mrr_at_100_diff1": 0.305768, + "nauc_mrr_at_1000_max": 0.046695, + "nauc_mrr_at_1000_std": -0.195944, + "nauc_mrr_at_1000_diff1": 0.305715, + "main_score": 0.35313, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 5563.747529506683, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/NFCorpus.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/NFCorpus.json new file mode 100644 index 000000000..3de9a3a96 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/NFCorpus.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "ec0fa4fe99da2ff19ca1214b7966684033a58814", + "task_name": "NFCorpus", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.61146, + "ndcg_at_3": 0.57554, + "ndcg_at_5": 0.55511, + "ndcg_at_10": 0.54248, + "ndcg_at_20": 0.5295, + "ndcg_at_100": 0.53599, + "ndcg_at_1000": 0.62104, + "map_at_1": 0.13059, + "map_at_3": 0.21599, + "map_at_5": 0.24643, + "map_at_10": 0.28891, + "map_at_20": 0.32094, + "map_at_100": 0.35371, + "map_at_1000": 0.37102, + "recall_at_1": 0.13059, + "recall_at_3": 0.23792, + "recall_at_5": 0.28785, + "recall_at_10": 0.36309, + "recall_at_20": 0.43784, + "recall_at_100": 0.58439, + "recall_at_1000": 0.83705, + "precision_at_1": 0.65015, + "precision_at_3": 0.52632, + "precision_at_5": 0.45325, + "precision_at_10": 0.36502, + "precision_at_20": 0.26904, + "precision_at_100": 0.10232, + "precision_at_1000": 0.02335, + "mrr_at_1": 0.650155, + "mrr_at_3": 0.737358, + "mrr_at_5": 0.751445, + "mrr_at_10": 0.757691, + "mrr_at_20": 0.758546, + "mrr_at_100": 0.759605, + "mrr_at_1000": 0.759605, + "nauc_ndcg_at_1_max": 0.275483, + "nauc_ndcg_at_1_std": 0.114967, + "nauc_ndcg_at_1_diff1": 0.32276, + "nauc_ndcg_at_3_max": 0.310718, + "nauc_ndcg_at_3_std": 0.187943, + "nauc_ndcg_at_3_diff1": 0.248749, + "nauc_ndcg_at_5_max": 0.316529, + "nauc_ndcg_at_5_std": 0.211495, + "nauc_ndcg_at_5_diff1": 0.238892, + "nauc_ndcg_at_10_max": 0.305766, + "nauc_ndcg_at_10_std": 0.201106, + "nauc_ndcg_at_10_diff1": 0.22364, + "nauc_ndcg_at_20_max": 0.281943, + "nauc_ndcg_at_20_std": 0.185832, + "nauc_ndcg_at_20_diff1": 0.217053, + "nauc_ndcg_at_100_max": 0.240772, + "nauc_ndcg_at_100_std": 0.14128, + "nauc_ndcg_at_100_diff1": 0.226474, + "nauc_ndcg_at_1000_max": 0.277243, + "nauc_ndcg_at_1000_std": 0.167237, + "nauc_ndcg_at_1000_diff1": 0.250099, + "nauc_map_at_1_max": -0.036005, + "nauc_map_at_1_std": -0.156046, + "nauc_map_at_1_diff1": 0.367597, + "nauc_map_at_3_max": -0.000628, + "nauc_map_at_3_std": -0.156815, + "nauc_map_at_3_diff1": 0.244182, + "nauc_map_at_5_max": 0.035562, + "nauc_map_at_5_std": -0.118991, + "nauc_map_at_5_diff1": 0.233576, + "nauc_map_at_10_max": 0.091683, + "nauc_map_at_10_std": -0.067388, + "nauc_map_at_10_diff1": 0.215456, + "nauc_map_at_20_max": 0.128545, + "nauc_map_at_20_std": -0.008956, + "nauc_map_at_20_diff1": 0.209826, + "nauc_map_at_100_max": 0.162495, + "nauc_map_at_100_std": 0.047455, + "nauc_map_at_100_diff1": 0.211963, + "nauc_map_at_1000_max": 0.175536, + "nauc_map_at_1000_std": 0.06455, + "nauc_map_at_1000_diff1": 0.213043, + "nauc_recall_at_1_max": -0.036005, + "nauc_recall_at_1_std": -0.156046, + "nauc_recall_at_1_diff1": 0.367597, + "nauc_recall_at_3_max": -0.012693, + "nauc_recall_at_3_std": -0.140587, + "nauc_recall_at_3_diff1": 0.213341, + "nauc_recall_at_5_max": 0.0166, + "nauc_recall_at_5_std": -0.095905, + "nauc_recall_at_5_diff1": 0.197508, + "nauc_recall_at_10_max": 0.066817, + "nauc_recall_at_10_std": -0.064965, + "nauc_recall_at_10_diff1": 0.176536, + "nauc_recall_at_20_max": 0.095474, + "nauc_recall_at_20_std": 0.000596, + "nauc_recall_at_20_diff1": 0.167307, + "nauc_recall_at_100_max": 0.115972, + "nauc_recall_at_100_std": 0.077753, + "nauc_recall_at_100_diff1": 0.172739, + "nauc_recall_at_1000_max": 0.162201, + "nauc_recall_at_1000_std": 0.097895, + "nauc_recall_at_1000_diff1": 0.201088, + "nauc_precision_at_1_max": 0.286704, + "nauc_precision_at_1_std": 0.087244, + "nauc_precision_at_1_diff1": 0.317495, + "nauc_precision_at_3_max": 0.351757, + "nauc_precision_at_3_std": 0.254462, + "nauc_precision_at_3_diff1": 0.058175, + "nauc_precision_at_5_max": 0.374192, + "nauc_precision_at_5_std": 0.334879, + "nauc_precision_at_5_diff1": 0.01342, + "nauc_precision_at_10_max": 0.38181, + "nauc_precision_at_10_std": 0.406276, + "nauc_precision_at_10_diff1": -0.032894, + "nauc_precision_at_20_max": 0.355905, + "nauc_precision_at_20_std": 0.458585, + "nauc_precision_at_20_diff1": -0.047402, + "nauc_precision_at_100_max": 0.240057, + "nauc_precision_at_100_std": 0.412188, + "nauc_precision_at_100_diff1": -0.094411, + "nauc_precision_at_1000_max": 0.076183, + "nauc_precision_at_1000_std": 0.189639, + "nauc_precision_at_1000_diff1": -0.115913, + "nauc_mrr_at_1_max": 0.286704, + "nauc_mrr_at_1_std": 0.087244, + "nauc_mrr_at_1_diff1": 0.317495, + "nauc_mrr_at_3_max": 0.339966, + "nauc_mrr_at_3_std": 0.165795, + "nauc_mrr_at_3_diff1": 0.344273, + "nauc_mrr_at_5_max": 0.323694, + "nauc_mrr_at_5_std": 0.151177, + "nauc_mrr_at_5_diff1": 0.33528, + "nauc_mrr_at_10_max": 0.32599, + "nauc_mrr_at_10_std": 0.153064, + "nauc_mrr_at_10_diff1": 0.333536, + "nauc_mrr_at_20_max": 0.324488, + "nauc_mrr_at_20_std": 0.151792, + "nauc_mrr_at_20_diff1": 0.333663, + "nauc_mrr_at_100_max": 0.324718, + "nauc_mrr_at_100_std": 0.149547, + "nauc_mrr_at_100_diff1": 0.333855, + "nauc_mrr_at_1000_max": 0.324718, + "nauc_mrr_at_1000_std": 0.149547, + "nauc_mrr_at_1000_diff1": 0.333855, + "main_score": 0.54248, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 9.501079320907593, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/NQ.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/NQ.json new file mode 100644 index 000000000..f75c941b1 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/NQ.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "b774495ed302d8c44a3a7ea25c90dbce03968f31", + "task_name": "NQ", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.24131, + "ndcg_at_3": 0.34291, + "ndcg_at_5": 0.3874, + "ndcg_at_10": 0.43898, + "ndcg_at_20": 0.47201, + "ndcg_at_100": 0.5055, + "ndcg_at_1000": 0.51068, + "map_at_1": 0.21147, + "map_at_3": 0.3063, + "map_at_5": 0.33192, + "map_at_10": 0.35514, + "map_at_20": 0.36524, + "map_at_100": 0.3707, + "map_at_1000": 0.37098, + "recall_at_1": 0.21147, + "recall_at_3": 0.41983, + "recall_at_5": 0.52284, + "recall_at_10": 0.67292, + "recall_at_20": 0.79621, + "recall_at_100": 0.9636, + "recall_at_1000": 0.99971, + "precision_at_1": 0.24131, + "precision_at_3": 0.16271, + "precision_at_5": 0.123, + "precision_at_10": 0.08033, + "precision_at_20": 0.04786, + "precision_at_100": 0.01168, + "precision_at_1000": 0.00122, + "mrr_at_1": 0.241599, + "mrr_at_3": 0.335603, + "mrr_at_5": 0.360211, + "mrr_at_10": 0.37984, + "mrr_at_20": 0.387792, + "mrr_at_100": 0.391873, + "mrr_at_1000": 0.392043, + "nauc_ndcg_at_1_max": 0.061177, + "nauc_ndcg_at_1_std": -0.127955, + "nauc_ndcg_at_1_diff1": 0.26539, + "nauc_ndcg_at_3_max": 0.057799, + "nauc_ndcg_at_3_std": -0.175117, + "nauc_ndcg_at_3_diff1": 0.225407, + "nauc_ndcg_at_5_max": 0.066116, + "nauc_ndcg_at_5_std": -0.185306, + "nauc_ndcg_at_5_diff1": 0.231721, + "nauc_ndcg_at_10_max": 0.07829, + "nauc_ndcg_at_10_std": -0.183604, + "nauc_ndcg_at_10_diff1": 0.228204, + "nauc_ndcg_at_20_max": 0.082838, + "nauc_ndcg_at_20_std": -0.176642, + "nauc_ndcg_at_20_diff1": 0.231847, + "nauc_ndcg_at_100_max": 0.078262, + "nauc_ndcg_at_100_std": -0.167512, + "nauc_ndcg_at_100_diff1": 0.233122, + "nauc_ndcg_at_1000_max": 0.07453, + "nauc_ndcg_at_1000_std": -0.167469, + "nauc_ndcg_at_1000_diff1": 0.233286, + "nauc_map_at_1_max": 0.041952, + "nauc_map_at_1_std": -0.142862, + "nauc_map_at_1_diff1": 0.266529, + "nauc_map_at_3_max": 0.050855, + "nauc_map_at_3_std": -0.171068, + "nauc_map_at_3_diff1": 0.233414, + "nauc_map_at_5_max": 0.056009, + "nauc_map_at_5_std": -0.177414, + "nauc_map_at_5_diff1": 0.238283, + "nauc_map_at_10_max": 0.062152, + "nauc_map_at_10_std": -0.175015, + "nauc_map_at_10_diff1": 0.236473, + "nauc_map_at_20_max": 0.063356, + "nauc_map_at_20_std": -0.172837, + "nauc_map_at_20_diff1": 0.237342, + "nauc_map_at_100_max": 0.062927, + "nauc_map_at_100_std": -0.171194, + "nauc_map_at_100_diff1": 0.237403, + "nauc_map_at_1000_max": 0.062796, + "nauc_map_at_1000_std": -0.171127, + "nauc_map_at_1000_diff1": 0.237426, + "nauc_recall_at_1_max": 0.041952, + "nauc_recall_at_1_std": -0.142862, + "nauc_recall_at_1_diff1": 0.266529, + "nauc_recall_at_3_max": 0.059579, + "nauc_recall_at_3_std": -0.196857, + "nauc_recall_at_3_diff1": 0.19804, + "nauc_recall_at_5_max": 0.075902, + "nauc_recall_at_5_std": -0.221341, + "nauc_recall_at_5_diff1": 0.209203, + "nauc_recall_at_10_max": 0.115202, + "nauc_recall_at_10_std": -0.232969, + "nauc_recall_at_10_diff1": 0.195654, + "nauc_recall_at_20_max": 0.156148, + "nauc_recall_at_20_std": -0.214551, + "nauc_recall_at_20_diff1": 0.208203, + "nauc_recall_at_100_max": 0.270503, + "nauc_recall_at_100_std": -0.128395, + "nauc_recall_at_100_diff1": 0.215204, + "nauc_recall_at_1000_max": 0.593835, + "nauc_recall_at_1000_std": 0.649867, + "nauc_recall_at_1000_diff1": -0.205901, + "nauc_precision_at_1_max": 0.061177, + "nauc_precision_at_1_std": -0.127955, + "nauc_precision_at_1_diff1": 0.26539, + "nauc_precision_at_3_max": 0.087624, + "nauc_precision_at_3_std": -0.16356, + "nauc_precision_at_3_diff1": 0.187622, + "nauc_precision_at_5_max": 0.108383, + "nauc_precision_at_5_std": -0.161541, + "nauc_precision_at_5_diff1": 0.179799, + "nauc_precision_at_10_max": 0.139711, + "nauc_precision_at_10_std": -0.107442, + "nauc_precision_at_10_diff1": 0.126609, + "nauc_precision_at_20_max": 0.15269, + "nauc_precision_at_20_std": -0.040376, + "nauc_precision_at_20_diff1": 0.081295, + "nauc_precision_at_100_max": 0.124636, + "nauc_precision_at_100_std": 0.095578, + "nauc_precision_at_100_diff1": -0.021733, + "nauc_precision_at_1000_max": 0.090893, + "nauc_precision_at_1000_std": 0.122458, + "nauc_precision_at_1000_diff1": -0.051766, + "nauc_mrr_at_1_max": 0.062758, + "nauc_mrr_at_1_std": -0.128557, + "nauc_mrr_at_1_diff1": 0.264324, + "nauc_mrr_at_3_max": 0.069292, + "nauc_mrr_at_3_std": -0.152565, + "nauc_mrr_at_3_diff1": 0.233456, + "nauc_mrr_at_5_max": 0.072708, + "nauc_mrr_at_5_std": -0.156851, + "nauc_mrr_at_5_diff1": 0.235235, + "nauc_mrr_at_10_max": 0.075187, + "nauc_mrr_at_10_std": -0.156877, + "nauc_mrr_at_10_diff1": 0.234609, + "nauc_mrr_at_20_max": 0.075442, + "nauc_mrr_at_20_std": -0.156254, + "nauc_mrr_at_20_diff1": 0.236153, + "nauc_mrr_at_100_max": 0.074768, + "nauc_mrr_at_100_std": -0.155228, + "nauc_mrr_at_100_diff1": 0.236582, + "nauc_mrr_at_1000_max": 0.074644, + "nauc_mrr_at_1000_std": -0.155241, + "nauc_mrr_at_1000_diff1": 0.236576, + "main_score": 0.43898, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 2121.3226385116577, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/QuoraRetrieval.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/QuoraRetrieval.json new file mode 100644 index 000000000..08e589a14 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/QuoraRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "e4e08e0b7dbe3c8700f0daef558ff32256715259", + "task_name": "QuoraRetrieval", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.8267, + "ndcg_at_3": 0.86918, + "ndcg_at_5": 0.88482, + "ndcg_at_10": 0.8973, + "ndcg_at_20": 0.9034, + "ndcg_at_100": 0.90709, + "ndcg_at_1000": 0.90753, + "map_at_1": 0.71706, + "map_at_3": 0.82996, + "map_at_5": 0.849, + "map_at_10": 0.86028, + "map_at_20": 0.86454, + "map_at_100": 0.86641, + "map_at_1000": 0.86652, + "recall_at_1": 0.71706, + "recall_at_3": 0.88689, + "recall_at_5": 0.93131, + "recall_at_10": 0.96803, + "recall_at_20": 0.98674, + "recall_at_100": 0.99856, + "recall_at_1000": 0.99994, + "precision_at_1": 0.8267, + "precision_at_3": 0.38133, + "precision_at_5": 0.25122, + "precision_at_10": 0.13703, + "precision_at_20": 0.07269, + "precision_at_100": 0.01542, + "precision_at_1000": 0.00157, + "mrr_at_1": 0.8267, + "mrr_at_3": 0.879133, + "mrr_at_5": 0.885548, + "mrr_at_10": 0.888206, + "mrr_at_20": 0.888742, + "mrr_at_100": 0.88885, + "mrr_at_1000": 0.888852, + "nauc_ndcg_at_1_max": 0.332766, + "nauc_ndcg_at_1_std": -0.52977, + "nauc_ndcg_at_1_diff1": 0.764176, + "nauc_ndcg_at_3_max": 0.307057, + "nauc_ndcg_at_3_std": -0.63782, + "nauc_ndcg_at_3_diff1": 0.734488, + "nauc_ndcg_at_5_max": 0.307328, + "nauc_ndcg_at_5_std": -0.657364, + "nauc_ndcg_at_5_diff1": 0.739454, + "nauc_ndcg_at_10_max": 0.310069, + "nauc_ndcg_at_10_std": -0.643153, + "nauc_ndcg_at_10_diff1": 0.742469, + "nauc_ndcg_at_20_max": 0.315709, + "nauc_ndcg_at_20_std": -0.622236, + "nauc_ndcg_at_20_diff1": 0.743433, + "nauc_ndcg_at_100_max": 0.320338, + "nauc_ndcg_at_100_std": -0.598332, + "nauc_ndcg_at_100_diff1": 0.743081, + "nauc_ndcg_at_1000_max": 0.321592, + "nauc_ndcg_at_1000_std": -0.594266, + "nauc_ndcg_at_1000_diff1": 0.742711, + "nauc_map_at_1_max": 0.236421, + "nauc_map_at_1_std": -0.520547, + "nauc_map_at_1_diff1": 0.785142, + "nauc_map_at_3_max": 0.288718, + "nauc_map_at_3_std": -0.64426, + "nauc_map_at_3_diff1": 0.750427, + "nauc_map_at_5_max": 0.298773, + "nauc_map_at_5_std": -0.650887, + "nauc_map_at_5_diff1": 0.746348, + "nauc_map_at_10_max": 0.305399, + "nauc_map_at_10_std": -0.635714, + "nauc_map_at_10_diff1": 0.744349, + "nauc_map_at_20_max": 0.307938, + "nauc_map_at_20_std": -0.623011, + "nauc_map_at_20_diff1": 0.743787, + "nauc_map_at_100_max": 0.30887, + "nauc_map_at_100_std": -0.613817, + "nauc_map_at_100_diff1": 0.742962, + "nauc_map_at_1000_max": 0.309135, + "nauc_map_at_1000_std": -0.61307, + "nauc_map_at_1000_diff1": 0.742901, + "nauc_recall_at_1_max": 0.236421, + "nauc_recall_at_1_std": -0.520547, + "nauc_recall_at_1_diff1": 0.785142, + "nauc_recall_at_3_max": 0.249435, + "nauc_recall_at_3_std": -0.7628, + "nauc_recall_at_3_diff1": 0.703111, + "nauc_recall_at_5_max": 0.249419, + "nauc_recall_at_5_std": -0.880645, + "nauc_recall_at_5_diff1": 0.69125, + "nauc_recall_at_10_max": 0.228575, + "nauc_recall_at_10_std": -1.024149, + "nauc_recall_at_10_diff1": 0.698238, + "nauc_recall_at_20_max": 0.205357, + "nauc_recall_at_20_std": -1.148009, + "nauc_recall_at_20_diff1": 0.701011, + "nauc_recall_at_100_max": 0.068155, + "nauc_recall_at_100_std": -1.339387, + "nauc_recall_at_100_diff1": 0.76857, + "nauc_recall_at_1000_max": -0.146695, + "nauc_recall_at_1000_std": -1.500684, + "nauc_recall_at_1000_diff1": 0.779582, + "nauc_precision_at_1_max": 0.332766, + "nauc_precision_at_1_std": -0.52977, + "nauc_precision_at_1_diff1": 0.764176, + "nauc_precision_at_3_max": 0.054244, + "nauc_precision_at_3_std": 0.044489, + "nauc_precision_at_3_diff1": -0.224617, + "nauc_precision_at_5_max": 0.002426, + "nauc_precision_at_5_std": 0.180339, + "nauc_precision_at_5_diff1": -0.340889, + "nauc_precision_at_10_max": -0.036423, + "nauc_precision_at_10_std": 0.305581, + "nauc_precision_at_10_diff1": -0.40481, + "nauc_precision_at_20_max": -0.053166, + "nauc_precision_at_20_std": 0.379037, + "nauc_precision_at_20_diff1": -0.422675, + "nauc_precision_at_100_max": -0.061917, + "nauc_precision_at_100_std": 0.448173, + "nauc_precision_at_100_diff1": -0.432039, + "nauc_precision_at_1000_max": -0.058959, + "nauc_precision_at_1000_std": 0.466794, + "nauc_precision_at_1000_diff1": -0.43352, + "nauc_mrr_at_1_max": 0.333126, + "nauc_mrr_at_1_std": -0.531267, + "nauc_mrr_at_1_diff1": 0.764176, + "nauc_mrr_at_3_max": 0.331662, + "nauc_mrr_at_3_std": -0.587466, + "nauc_mrr_at_3_diff1": 0.75004, + "nauc_mrr_at_5_max": 0.334293, + "nauc_mrr_at_5_std": -0.584107, + "nauc_mrr_at_5_diff1": 0.752415, + "nauc_mrr_at_10_max": 0.333427, + "nauc_mrr_at_10_std": -0.578479, + "nauc_mrr_at_10_diff1": 0.75343, + "nauc_mrr_at_20_max": 0.33335, + "nauc_mrr_at_20_std": -0.57663, + "nauc_mrr_at_20_diff1": 0.753402, + "nauc_mrr_at_100_max": 0.33323, + "nauc_mrr_at_100_std": -0.57613, + "nauc_mrr_at_100_diff1": 0.753467, + "nauc_mrr_at_1000_max": 0.333235, + "nauc_mrr_at_1000_std": -0.576115, + "nauc_mrr_at_1000_diff1": 0.753467, + "main_score": 0.8973, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 289.4270315170288, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/SCIDOCS.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/SCIDOCS.json new file mode 100644 index 000000000..18cae4dc9 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/SCIDOCS.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88", + "task_name": "SCIDOCS", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.465, + "ndcg_at_3": 0.38659, + "ndcg_at_5": 0.34364, + "ndcg_at_10": 0.40687, + "ndcg_at_20": 0.44822, + "ndcg_at_100": 0.50367, + "ndcg_at_1000": 0.54585, + "map_at_1": 0.09495, + "map_at_3": 0.18671, + "map_at_5": 0.23364, + "map_at_10": 0.27685, + "map_at_20": 0.29673, + "map_at_100": 0.31109, + "map_at_1000": 0.31433, + "recall_at_1": 0.09495, + "recall_at_3": 0.22223, + "recall_at_5": 0.31053, + "recall_at_10": 0.42682, + "recall_at_20": 0.52308, + "recall_at_100": 0.70135, + "recall_at_1000": 0.90337, + "precision_at_1": 0.465, + "precision_at_3": 0.363, + "precision_at_5": 0.3044, + "precision_at_10": 0.2092, + "precision_at_20": 0.1284, + "precision_at_100": 0.03449, + "precision_at_1000": 0.00445, + "mrr_at_1": 0.465, + "mrr_at_3": 0.573, + "mrr_at_5": 0.5926, + "mrr_at_10": 0.603045, + "mrr_at_20": 0.606841, + "mrr_at_100": 0.608631, + "mrr_at_1000": 0.608716, + "nauc_ndcg_at_1_max": 0.293214, + "nauc_ndcg_at_1_std": 0.167402, + "nauc_ndcg_at_1_diff1": 0.255968, + "nauc_ndcg_at_3_max": 0.34894, + "nauc_ndcg_at_3_std": 0.281459, + "nauc_ndcg_at_3_diff1": 0.158067, + "nauc_ndcg_at_5_max": 0.379759, + "nauc_ndcg_at_5_std": 0.337014, + "nauc_ndcg_at_5_diff1": 0.126296, + "nauc_ndcg_at_10_max": 0.426068, + "nauc_ndcg_at_10_std": 0.403413, + "nauc_ndcg_at_10_diff1": 0.128702, + "nauc_ndcg_at_20_max": 0.45188, + "nauc_ndcg_at_20_std": 0.442751, + "nauc_ndcg_at_20_diff1": 0.133693, + "nauc_ndcg_at_100_max": 0.452376, + "nauc_ndcg_at_100_std": 0.444992, + "nauc_ndcg_at_100_diff1": 0.148907, + "nauc_ndcg_at_1000_max": 0.438895, + "nauc_ndcg_at_1000_std": 0.422683, + "nauc_ndcg_at_1000_diff1": 0.148209, + "nauc_map_at_1_max": 0.286813, + "nauc_map_at_1_std": 0.163843, + "nauc_map_at_1_diff1": 0.251706, + "nauc_map_at_3_max": 0.332213, + "nauc_map_at_3_std": 0.269948, + "nauc_map_at_3_diff1": 0.139829, + "nauc_map_at_5_max": 0.365277, + "nauc_map_at_5_std": 0.323089, + "nauc_map_at_5_diff1": 0.105362, + "nauc_map_at_10_max": 0.407525, + "nauc_map_at_10_std": 0.384811, + "nauc_map_at_10_diff1": 0.104996, + "nauc_map_at_20_max": 0.429453, + "nauc_map_at_20_std": 0.417172, + "nauc_map_at_20_diff1": 0.109316, + "nauc_map_at_100_max": 0.432874, + "nauc_map_at_100_std": 0.423174, + "nauc_map_at_100_diff1": 0.11322, + "nauc_map_at_1000_max": 0.431905, + "nauc_map_at_1000_std": 0.422115, + "nauc_map_at_1000_diff1": 0.112752, + "nauc_recall_at_1_max": 0.286813, + "nauc_recall_at_1_std": 0.163843, + "nauc_recall_at_1_diff1": 0.251706, + "nauc_recall_at_3_max": 0.361579, + "nauc_recall_at_3_std": 0.319153, + "nauc_recall_at_3_diff1": 0.119143, + "nauc_recall_at_5_max": 0.38484, + "nauc_recall_at_5_std": 0.382559, + "nauc_recall_at_5_diff1": 0.064575, + "nauc_recall_at_10_max": 0.439049, + "nauc_recall_at_10_std": 0.469463, + "nauc_recall_at_10_diff1": 0.070757, + "nauc_recall_at_20_max": 0.466461, + "nauc_recall_at_20_std": 0.527865, + "nauc_recall_at_20_diff1": 0.072292, + "nauc_recall_at_100_max": 0.43519, + "nauc_recall_at_100_std": 0.511603, + "nauc_recall_at_100_diff1": 0.106438, + "nauc_recall_at_1000_max": 0.35312, + "nauc_recall_at_1000_std": 0.431113, + "nauc_recall_at_1000_diff1": 0.08166, + "nauc_precision_at_1_max": 0.293214, + "nauc_precision_at_1_std": 0.167402, + "nauc_precision_at_1_diff1": 0.255968, + "nauc_precision_at_3_max": 0.364825, + "nauc_precision_at_3_std": 0.32263, + "nauc_precision_at_3_diff1": 0.1194, + "nauc_precision_at_5_max": 0.389554, + "nauc_precision_at_5_std": 0.390655, + "nauc_precision_at_5_diff1": 0.065099, + "nauc_precision_at_10_max": 0.444624, + "nauc_precision_at_10_std": 0.477805, + "nauc_precision_at_10_diff1": 0.069943, + "nauc_precision_at_20_max": 0.467854, + "nauc_precision_at_20_std": 0.530109, + "nauc_precision_at_20_diff1": 0.072193, + "nauc_precision_at_100_max": 0.426579, + "nauc_precision_at_100_std": 0.504558, + "nauc_precision_at_100_diff1": 0.103314, + "nauc_precision_at_1000_max": 0.30065, + "nauc_precision_at_1000_std": 0.376868, + "nauc_precision_at_1000_diff1": 0.057053, + "nauc_mrr_at_1_max": 0.293214, + "nauc_mrr_at_1_std": 0.167402, + "nauc_mrr_at_1_diff1": 0.255968, + "nauc_mrr_at_3_max": 0.348344, + "nauc_mrr_at_3_std": 0.236379, + "nauc_mrr_at_3_diff1": 0.238412, + "nauc_mrr_at_5_max": 0.351867, + "nauc_mrr_at_5_std": 0.245859, + "nauc_mrr_at_5_diff1": 0.235854, + "nauc_mrr_at_10_max": 0.350206, + "nauc_mrr_at_10_std": 0.243563, + "nauc_mrr_at_10_diff1": 0.238027, + "nauc_mrr_at_20_max": 0.347613, + "nauc_mrr_at_20_std": 0.238879, + "nauc_mrr_at_20_diff1": 0.238763, + "nauc_mrr_at_100_max": 0.346391, + "nauc_mrr_at_100_std": 0.237577, + "nauc_mrr_at_100_diff1": 0.238819, + "nauc_mrr_at_1000_max": 0.346298, + "nauc_mrr_at_1000_std": 0.23744, + "nauc_mrr_at_1000_diff1": 0.238751, + "main_score": 0.40687, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 45.49591135978699, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/SciFact.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/SciFact.json new file mode 100644 index 000000000..75cd6b290 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/SciFact.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "0228b52cf27578f30900b9e5271d331663a030d7", + "task_name": "SciFact", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.72, + "ndcg_at_3": 0.79577, + "ndcg_at_5": 0.82586, + "ndcg_at_10": 0.84129, + "ndcg_at_20": 0.84851, + "ndcg_at_100": 0.85037, + "ndcg_at_1000": 0.85037, + "map_at_1": 0.68744, + "map_at_3": 0.7695, + "map_at_5": 0.79027, + "map_at_10": 0.79745, + "map_at_20": 0.80021, + "map_at_100": 0.8006, + "map_at_1000": 0.8006, + "recall_at_1": 0.68744, + "recall_at_3": 0.8495, + "recall_at_5": 0.92078, + "recall_at_10": 0.96617, + "recall_at_20": 0.99167, + "recall_at_100": 1.0, + "recall_at_1000": 1.0, + "precision_at_1": 0.72, + "precision_at_3": 0.30667, + "precision_at_5": 0.20467, + "precision_at_10": 0.10833, + "precision_at_20": 0.056, + "precision_at_100": 0.0113, + "precision_at_1000": 0.00113, + "mrr_at_1": 0.72, + "mrr_at_3": 0.783333, + "mrr_at_5": 0.799167, + "mrr_at_10": 0.804808, + "mrr_at_20": 0.806295, + "mrr_at_100": 0.806593, + "mrr_at_1000": 0.806593, + "nauc_ndcg_at_1_max": 0.110227, + "nauc_ndcg_at_1_std": -0.413818, + "nauc_ndcg_at_1_diff1": 0.678451, + "nauc_ndcg_at_3_max": 0.12417, + "nauc_ndcg_at_3_std": -0.560678, + "nauc_ndcg_at_3_diff1": 0.661864, + "nauc_ndcg_at_5_max": 0.097149, + "nauc_ndcg_at_5_std": -0.544778, + "nauc_ndcg_at_5_diff1": 0.660709, + "nauc_ndcg_at_10_max": 0.100481, + "nauc_ndcg_at_10_std": -0.530103, + "nauc_ndcg_at_10_diff1": 0.654975, + "nauc_ndcg_at_20_max": 0.104447, + "nauc_ndcg_at_20_std": -0.514411, + "nauc_ndcg_at_20_diff1": 0.66305, + "nauc_ndcg_at_100_max": 0.105114, + "nauc_ndcg_at_100_std": -0.509134, + "nauc_ndcg_at_100_diff1": 0.664661, + "nauc_ndcg_at_1000_max": 0.105114, + "nauc_ndcg_at_1000_std": -0.509134, + "nauc_ndcg_at_1000_diff1": 0.664661, + "nauc_map_at_1_max": 0.097749, + "nauc_map_at_1_std": -0.42442, + "nauc_map_at_1_diff1": 0.696292, + "nauc_map_at_3_max": 0.1117, + "nauc_map_at_3_std": -0.531002, + "nauc_map_at_3_diff1": 0.673252, + "nauc_map_at_5_max": 0.100632, + "nauc_map_at_5_std": -0.523343, + "nauc_map_at_5_diff1": 0.672538, + "nauc_map_at_10_max": 0.104164, + "nauc_map_at_10_std": -0.515081, + "nauc_map_at_10_diff1": 0.66871, + "nauc_map_at_20_max": 0.104185, + "nauc_map_at_20_std": -0.510903, + "nauc_map_at_20_diff1": 0.670864, + "nauc_map_at_100_max": 0.10417, + "nauc_map_at_100_std": -0.509973, + "nauc_map_at_100_diff1": 0.671061, + "nauc_map_at_1000_max": 0.10417, + "nauc_map_at_1000_std": -0.509973, + "nauc_map_at_1000_diff1": 0.671061, + "nauc_recall_at_1_max": 0.097749, + "nauc_recall_at_1_std": -0.42442, + "nauc_recall_at_1_diff1": 0.696292, + "nauc_recall_at_3_max": 0.156252, + "nauc_recall_at_3_std": -0.681735, + "nauc_recall_at_3_diff1": 0.636781, + "nauc_recall_at_5_max": 0.062329, + "nauc_recall_at_5_std": -0.720598, + "nauc_recall_at_5_diff1": 0.603973, + "nauc_recall_at_10_max": 0.012191, + "nauc_recall_at_10_std": -0.832013, + "nauc_recall_at_10_diff1": 0.499351, + "nauc_recall_at_20_max": 0.031466, + "nauc_recall_at_20_std": -0.877218, + "nauc_recall_at_20_diff1": 0.531466, + "nauc_recall_at_100_max": NaN, + "nauc_recall_at_100_std": NaN, + "nauc_recall_at_100_diff1": NaN, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": 0.110227, + "nauc_precision_at_1_std": -0.413818, + "nauc_precision_at_1_diff1": 0.678451, + "nauc_precision_at_3_max": 0.15351, + "nauc_precision_at_3_std": -0.320099, + "nauc_precision_at_3_diff1": 0.242078, + "nauc_precision_at_5_max": 0.040197, + "nauc_precision_at_5_std": -0.076705, + "nauc_precision_at_5_diff1": -0.021522, + "nauc_precision_at_10_max": 0.052288, + "nauc_precision_at_10_std": 0.128876, + "nauc_precision_at_10_diff1": -0.224653, + "nauc_precision_at_20_max": 0.025358, + "nauc_precision_at_20_std": 0.240093, + "nauc_precision_at_20_diff1": -0.304318, + "nauc_precision_at_100_max": 0.018974, + "nauc_precision_at_100_std": 0.286152, + "nauc_precision_at_100_diff1": -0.332432, + "nauc_precision_at_1000_max": 0.018974, + "nauc_precision_at_1000_std": 0.286152, + "nauc_precision_at_1000_diff1": -0.332432, + "nauc_mrr_at_1_max": 0.110227, + "nauc_mrr_at_1_std": -0.413818, + "nauc_mrr_at_1_diff1": 0.678451, + "nauc_mrr_at_3_max": 0.118583, + "nauc_mrr_at_3_std": -0.518342, + "nauc_mrr_at_3_diff1": 0.660487, + "nauc_mrr_at_5_max": 0.103955, + "nauc_mrr_at_5_std": -0.50266, + "nauc_mrr_at_5_diff1": 0.655397, + "nauc_mrr_at_10_max": 0.103111, + "nauc_mrr_at_10_std": -0.498531, + "nauc_mrr_at_10_diff1": 0.654936, + "nauc_mrr_at_20_max": 0.104831, + "nauc_mrr_at_20_std": -0.495763, + "nauc_mrr_at_20_diff1": 0.657652, + "nauc_mrr_at_100_max": 0.105137, + "nauc_mrr_at_100_std": -0.495422, + "nauc_mrr_at_100_diff1": 0.658002, + "nauc_mrr_at_1000_max": 0.105137, + "nauc_mrr_at_1000_std": -0.495422, + "nauc_mrr_at_1000_diff1": 0.658002, + "main_score": 0.84129, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 11.949984312057495, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/TRECCOVID.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/TRECCOVID.json new file mode 100644 index 000000000..a10e6b0fe --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/TRECCOVID.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "bb9466bac8153a0349341eb1b22e06409e78ef4e", + "task_name": "TRECCOVID", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.74, + "ndcg_at_3": 0.64754, + "ndcg_at_5": 0.61072, + "ndcg_at_10": 0.573, + "ndcg_at_20": 0.5388, + "ndcg_at_100": 0.41767, + "ndcg_at_1000": 0.36256, + "map_at_1": 0.00207, + "map_at_3": 0.00512, + "map_at_5": 0.00779, + "map_at_10": 0.01306, + "map_at_20": 0.02268, + "map_at_100": 0.07062, + "map_at_1000": 0.14901, + "recall_at_1": 0.00207, + "recall_at_3": 0.00537, + "recall_at_5": 0.0085, + "recall_at_10": 0.01501, + "recall_at_20": 0.02855, + "recall_at_100": 0.10579, + "recall_at_1000": 0.33661, + "precision_at_1": 0.78, + "precision_at_3": 0.66667, + "precision_at_5": 0.636, + "precision_at_10": 0.592, + "precision_at_20": 0.562, + "precision_at_100": 0.427, + "precision_at_1000": 0.15268, + "mrr_at_1": 0.78, + "mrr_at_3": 0.836667, + "mrr_at_5": 0.845667, + "mrr_at_10": 0.851857, + "mrr_at_20": 0.85291, + "mrr_at_100": 0.85291, + "mrr_at_1000": 0.85291, + "nauc_ndcg_at_1_max": 0.392381, + "nauc_ndcg_at_1_std": 0.455578, + "nauc_ndcg_at_1_diff1": -0.055188, + "nauc_ndcg_at_3_max": 0.457943, + "nauc_ndcg_at_3_std": 0.445792, + "nauc_ndcg_at_3_diff1": -0.031822, + "nauc_ndcg_at_5_max": 0.482216, + "nauc_ndcg_at_5_std": 0.466917, + "nauc_ndcg_at_5_diff1": -0.074179, + "nauc_ndcg_at_10_max": 0.466109, + "nauc_ndcg_at_10_std": 0.475325, + "nauc_ndcg_at_10_diff1": -0.030068, + "nauc_ndcg_at_20_max": 0.402529, + "nauc_ndcg_at_20_std": 0.477238, + "nauc_ndcg_at_20_diff1": -0.06391, + "nauc_ndcg_at_100_max": 0.391329, + "nauc_ndcg_at_100_std": 0.604881, + "nauc_ndcg_at_100_diff1": -0.132915, + "nauc_ndcg_at_1000_max": 0.414183, + "nauc_ndcg_at_1000_std": 0.738869, + "nauc_ndcg_at_1000_diff1": -0.161401, + "nauc_map_at_1_max": 0.143129, + "nauc_map_at_1_std": 0.346453, + "nauc_map_at_1_diff1": 0.05718, + "nauc_map_at_3_max": 0.241286, + "nauc_map_at_3_std": 0.40966, + "nauc_map_at_3_diff1": 0.066085, + "nauc_map_at_5_max": 0.31109, + "nauc_map_at_5_std": 0.45919, + "nauc_map_at_5_diff1": 0.084709, + "nauc_map_at_10_max": 0.382424, + "nauc_map_at_10_std": 0.514002, + "nauc_map_at_10_diff1": 0.129258, + "nauc_map_at_20_max": 0.344696, + "nauc_map_at_20_std": 0.522152, + "nauc_map_at_20_diff1": 0.107713, + "nauc_map_at_100_max": 0.318547, + "nauc_map_at_100_std": 0.688659, + "nauc_map_at_100_diff1": -0.074522, + "nauc_map_at_1000_max": 0.386053, + "nauc_map_at_1000_std": 0.764998, + "nauc_map_at_1000_diff1": -0.137991, + "nauc_recall_at_1_max": 0.143129, + "nauc_recall_at_1_std": 0.346453, + "nauc_recall_at_1_diff1": 0.05718, + "nauc_recall_at_3_max": 0.23389, + "nauc_recall_at_3_std": 0.400527, + "nauc_recall_at_3_diff1": 0.057768, + "nauc_recall_at_5_max": 0.288314, + "nauc_recall_at_5_std": 0.441295, + "nauc_recall_at_5_diff1": 0.054858, + "nauc_recall_at_10_max": 0.368777, + "nauc_recall_at_10_std": 0.501625, + "nauc_recall_at_10_diff1": 0.138749, + "nauc_recall_at_20_max": 0.294566, + "nauc_recall_at_20_std": 0.501707, + "nauc_recall_at_20_diff1": 0.094113, + "nauc_recall_at_100_max": 0.256634, + "nauc_recall_at_100_std": 0.667291, + "nauc_recall_at_100_diff1": -0.082569, + "nauc_recall_at_1000_max": 0.355017, + "nauc_recall_at_1000_std": 0.711869, + "nauc_recall_at_1000_diff1": -0.171658, + "nauc_precision_at_1_max": 0.465109, + "nauc_precision_at_1_std": 0.555942, + "nauc_precision_at_1_diff1": -0.075625, + "nauc_precision_at_3_max": 0.475561, + "nauc_precision_at_3_std": 0.519691, + "nauc_precision_at_3_diff1": -0.085408, + "nauc_precision_at_5_max": 0.498623, + "nauc_precision_at_5_std": 0.526419, + "nauc_precision_at_5_diff1": -0.141367, + "nauc_precision_at_10_max": 0.466378, + "nauc_precision_at_10_std": 0.521483, + "nauc_precision_at_10_diff1": -0.043758, + "nauc_precision_at_20_max": 0.384533, + "nauc_precision_at_20_std": 0.521337, + "nauc_precision_at_20_diff1": -0.060843, + "nauc_precision_at_100_max": 0.386549, + "nauc_precision_at_100_std": 0.659443, + "nauc_precision_at_100_diff1": -0.159413, + "nauc_precision_at_1000_max": 0.368176, + "nauc_precision_at_1000_std": 0.520282, + "nauc_precision_at_1000_diff1": -0.24778, + "nauc_mrr_at_1_max": 0.465109, + "nauc_mrr_at_1_std": 0.555942, + "nauc_mrr_at_1_diff1": -0.075625, + "nauc_mrr_at_3_max": 0.510401, + "nauc_mrr_at_3_std": 0.60827, + "nauc_mrr_at_3_diff1": -0.081019, + "nauc_mrr_at_5_max": 0.522595, + "nauc_mrr_at_5_std": 0.609701, + "nauc_mrr_at_5_diff1": -0.100118, + "nauc_mrr_at_10_max": 0.517714, + "nauc_mrr_at_10_std": 0.608716, + "nauc_mrr_at_10_diff1": -0.067246, + "nauc_mrr_at_20_max": 0.515019, + "nauc_mrr_at_20_std": 0.605717, + "nauc_mrr_at_20_diff1": -0.074424, + "nauc_mrr_at_100_max": 0.515019, + "nauc_mrr_at_100_std": 0.605717, + "nauc_mrr_at_100_diff1": -0.074424, + "nauc_mrr_at_1000_max": 0.515019, + "nauc_mrr_at_1000_std": 0.605717, + "nauc_mrr_at_1000_diff1": -0.074424, + "main_score": 0.573, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 271.0138192176819, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/Touche2020.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/Touche2020.json new file mode 100644 index 000000000..7a13b3f4a --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/Touche2020.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f", + "task_name": "Touche2020", + "mteb_version": "1.29.16", + "scores": { + "test": [ + { + "ndcg_at_1": 0.40816, + "ndcg_at_3": 0.31068, + "ndcg_at_5": 0.28539, + "ndcg_at_10": 0.28132, + "ndcg_at_20": 0.28773, + "ndcg_at_100": 0.40141, + "ndcg_at_1000": 0.531, + "map_at_1": 0.03498, + "map_at_3": 0.06515, + "map_at_5": 0.08657, + "map_at_10": 0.11995, + "map_at_20": 0.146, + "map_at_100": 0.18607, + "map_at_1000": 0.20593, + "recall_at_1": 0.03498, + "recall_at_3": 0.07386, + "recall_at_5": 0.1094, + "recall_at_10": 0.18326, + "recall_at_20": 0.25798, + "recall_at_100": 0.50626, + "recall_at_1000": 0.90418, + "precision_at_1": 0.44898, + "precision_at_3": 0.31973, + "precision_at_5": 0.28163, + "precision_at_10": 0.2449, + "precision_at_20": 0.18163, + "precision_at_100": 0.08204, + "precision_at_1000": 0.01673, + "mrr_at_1": 0.44898, + "mrr_at_3": 0.503401, + "mrr_at_5": 0.52585, + "mrr_at_10": 0.546987, + "mrr_at_20": 0.552138, + "mrr_at_100": 0.554601, + "mrr_at_1000": 0.554601, + "nauc_ndcg_at_1_max": -0.251927, + "nauc_ndcg_at_1_std": -0.289009, + "nauc_ndcg_at_1_diff1": -0.105365, + "nauc_ndcg_at_3_max": -0.1566, + "nauc_ndcg_at_3_std": -0.214134, + "nauc_ndcg_at_3_diff1": -0.038212, + "nauc_ndcg_at_5_max": -0.137196, + "nauc_ndcg_at_5_std": -0.23012, + "nauc_ndcg_at_5_diff1": -0.032239, + "nauc_ndcg_at_10_max": -0.160928, + "nauc_ndcg_at_10_std": -0.170079, + "nauc_ndcg_at_10_diff1": -0.063702, + "nauc_ndcg_at_20_max": -0.17352, + "nauc_ndcg_at_20_std": -0.181615, + "nauc_ndcg_at_20_diff1": -0.017577, + "nauc_ndcg_at_100_max": -0.211794, + "nauc_ndcg_at_100_std": 0.036702, + "nauc_ndcg_at_100_diff1": -0.111532, + "nauc_ndcg_at_1000_max": -0.163273, + "nauc_ndcg_at_1000_std": 0.042914, + "nauc_ndcg_at_1000_diff1": -0.094769, + "nauc_map_at_1_max": -0.228193, + "nauc_map_at_1_std": -0.352076, + "nauc_map_at_1_diff1": -0.033774, + "nauc_map_at_3_max": -0.097136, + "nauc_map_at_3_std": -0.31414, + "nauc_map_at_3_diff1": 0.003407, + "nauc_map_at_5_max": -0.044073, + "nauc_map_at_5_std": -0.301934, + "nauc_map_at_5_diff1": -0.027507, + "nauc_map_at_10_max": -0.035281, + "nauc_map_at_10_std": -0.264283, + "nauc_map_at_10_diff1": -0.018015, + "nauc_map_at_20_max": -0.052564, + "nauc_map_at_20_std": -0.224545, + "nauc_map_at_20_diff1": 0.023797, + "nauc_map_at_100_max": -0.069874, + "nauc_map_at_100_std": -0.116128, + "nauc_map_at_100_diff1": -0.033814, + "nauc_map_at_1000_max": -0.060651, + "nauc_map_at_1000_std": -0.090339, + "nauc_map_at_1000_diff1": -0.034286, + "nauc_recall_at_1_max": -0.228193, + "nauc_recall_at_1_std": -0.352076, + "nauc_recall_at_1_diff1": -0.033774, + "nauc_recall_at_3_max": -0.114124, + "nauc_recall_at_3_std": -0.305851, + "nauc_recall_at_3_diff1": 0.019247, + "nauc_recall_at_5_max": -0.084204, + "nauc_recall_at_5_std": -0.315016, + "nauc_recall_at_5_diff1": -0.033254, + "nauc_recall_at_10_max": -0.112465, + "nauc_recall_at_10_std": -0.227447, + "nauc_recall_at_10_diff1": -0.051077, + "nauc_recall_at_20_max": -0.154701, + "nauc_recall_at_20_std": -0.16866, + "nauc_recall_at_20_diff1": 0.021607, + "nauc_recall_at_100_max": -0.22614, + "nauc_recall_at_100_std": 0.236214, + "nauc_recall_at_100_diff1": -0.197783, + "nauc_recall_at_1000_max": -0.211984, + "nauc_recall_at_1000_std": 0.624835, + "nauc_recall_at_1000_diff1": -0.263823, + "nauc_precision_at_1_max": -0.269871, + "nauc_precision_at_1_std": -0.340744, + "nauc_precision_at_1_diff1": -0.033296, + "nauc_precision_at_3_max": -0.085547, + "nauc_precision_at_3_std": -0.206278, + "nauc_precision_at_3_diff1": 0.043832, + "nauc_precision_at_5_max": -0.052518, + "nauc_precision_at_5_std": -0.225913, + "nauc_precision_at_5_diff1": 0.080374, + "nauc_precision_at_10_max": -0.093132, + "nauc_precision_at_10_std": -0.030131, + "nauc_precision_at_10_diff1": 0.03419, + "nauc_precision_at_20_max": -0.080959, + "nauc_precision_at_20_std": 0.065308, + "nauc_precision_at_20_diff1": 0.102983, + "nauc_precision_at_100_max": -0.067894, + "nauc_precision_at_100_std": 0.60656, + "nauc_precision_at_100_diff1": -0.095316, + "nauc_precision_at_1000_max": 0.295658, + "nauc_precision_at_1000_std": 0.375909, + "nauc_precision_at_1000_diff1": 0.071221, + "nauc_mrr_at_1_max": -0.269871, + "nauc_mrr_at_1_std": -0.340744, + "nauc_mrr_at_1_diff1": -0.033296, + "nauc_mrr_at_3_max": -0.257731, + "nauc_mrr_at_3_std": -0.318056, + "nauc_mrr_at_3_diff1": -0.003001, + "nauc_mrr_at_5_max": -0.259045, + "nauc_mrr_at_5_std": -0.305417, + "nauc_mrr_at_5_diff1": 0.008144, + "nauc_mrr_at_10_max": -0.283269, + "nauc_mrr_at_10_std": -0.28981, + "nauc_mrr_at_10_diff1": -0.006209, + "nauc_mrr_at_20_max": -0.275642, + "nauc_mrr_at_20_std": -0.297802, + "nauc_mrr_at_20_diff1": 0.002673, + "nauc_mrr_at_100_max": -0.274197, + "nauc_mrr_at_100_std": -0.299837, + "nauc_mrr_at_100_diff1": -0.000139, + "nauc_mrr_at_1000_max": -0.274197, + "nauc_mrr_at_1000_std": -0.299837, + "nauc_mrr_at_1000_diff1": -0.000139, + "main_score": 0.28132, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 529.1015980243683, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/model_meta.json b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/model_meta.json new file mode 100644 index 000000000..8444899f1 --- /dev/null +++ b/results/iamgroot42__spice/1d0fdb2b5d7aed81bba960cd8c85671674d49bdc/model_meta.json @@ -0,0 +1 @@ +{"name": "iamgroot42/spice", "revision": "1d0fdb2b5d7aed81bba960cd8c85671674d49bdc", "release_date": "2025-01-27", "languages": ["eng_Latn"], "n_parameters": 24000000, "max_tokens": 512, "embed_dim": 512, "license": "mit", "open_weights": true, "public_training_code": null, "public_training_data": null, "framework": ["PyTorch"], "reference": null, "similarity_fn_name": null, "use_instructions": null, "training_datasets": null, "adapted_from": null, "superseded_by": null, "loader": null} \ No newline at end of file