diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonCounterfactualClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonCounterfactualClassification.json new file mode 100644 index 0000000000..e7c82c25cd --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonCounterfactualClassification.json @@ -0,0 +1,95 @@ +{ + "dataset_revision": "e8379541af4e31359cca9fbcf4b00f2671dba205", + "task_name": "AmazonCounterfactualClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.774776, + "f1": 0.712683, + "f1_weighted": 0.793739, + "ap": 0.404116, + "ap_weighted": 0.404116, + "scores_per_experiment": [ + { + "accuracy": 0.786567, + "f1": 0.717657, + "f1_weighted": 0.802598, + "ap": 0.40172, + "ap_weighted": 0.40172 + }, + { + "accuracy": 0.832836, + "f1": 0.772042, + "f1_weighted": 0.843729, + "ap": 0.481723, + "ap_weighted": 0.481723 + }, + { + "accuracy": 0.740299, + "f1": 0.679405, + "f1_weighted": 0.764489, + "ap": 0.364821, + "ap_weighted": 0.364821 + }, + { + "accuracy": 0.786567, + "f1": 0.716548, + "f1_weighted": 0.802337, + "ap": 0.399409, + "ap_weighted": 0.399409 + }, + { + "accuracy": 0.791045, + "f1": 0.729293, + "f1_weighted": 0.808027, + "ap": 0.4231, + "ap_weighted": 0.4231 + }, + { + "accuracy": 0.759701, + "f1": 0.702879, + "f1_weighted": 0.782004, + "ap": 0.396272, + "ap_weighted": 0.396272 + }, + { + "accuracy": 0.81194, + "f1": 0.749751, + "f1_weighted": 0.825719, + "ap": 0.449344, + "ap_weighted": 0.449344 + }, + { + "accuracy": 0.777612, + "f1": 0.70581, + "f1_weighted": 0.794315, + "ap": 0.384948, + "ap_weighted": 0.384948 + }, + { + "accuracy": 0.738806, + "f1": 0.686808, + "f1_weighted": 0.764519, + "ap": 0.383435, + "ap_weighted": 0.383435 + }, + { + "accuracy": 0.722388, + "f1": 0.666635, + "f1_weighted": 0.749654, + "ap": 0.356392, + "ap_weighted": 0.356392 + } + ], + "main_score": 0.774776, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 7.348646640777588, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonPolarityClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonPolarityClassification.json new file mode 100644 index 0000000000..7641f16644 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonPolarityClassification.json @@ -0,0 +1,95 @@ +{ + "dataset_revision": "e2d317d38cd51312af73b3d32a06d1a08b442046", + "task_name": "AmazonPolarityClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.931718, + "f1": 0.931546, + "f1_weighted": 0.931546, + "ap": 0.899049, + "ap_weighted": 0.899049, + "scores_per_experiment": [ + { + "accuracy": 0.941712, + "f1": 0.941674, + "f1_weighted": 0.941674, + "ap": 0.906392, + "ap_weighted": 0.906392 + }, + { + "accuracy": 0.937562, + "f1": 0.937526, + "f1_weighted": 0.937526, + "ap": 0.901397, + "ap_weighted": 0.901397 + }, + { + "accuracy": 0.943928, + "f1": 0.943917, + "f1_weighted": 0.943917, + "ap": 0.924645, + "ap_weighted": 0.924645 + }, + { + "accuracy": 0.914325, + "f1": 0.914016, + "f1_weighted": 0.914016, + "ap": 0.902212, + "ap_weighted": 0.902212 + }, + { + "accuracy": 0.930848, + "f1": 0.930693, + "f1_weighted": 0.930693, + "ap": 0.9204, + "ap_weighted": 0.9204 + }, + { + "accuracy": 0.920752, + "f1": 0.920531, + "f1_weighted": 0.920531, + "ap": 0.870495, + "ap_weighted": 0.870495 + }, + { + "accuracy": 0.941295, + "f1": 0.941281, + "f1_weighted": 0.941281, + "ap": 0.909586, + "ap_weighted": 0.909586 + }, + { + "accuracy": 0.947608, + "f1": 0.947583, + "f1_weighted": 0.947583, + "ap": 0.915868, + "ap_weighted": 0.915868 + }, + { + "accuracy": 0.940945, + "f1": 0.940917, + "f1_weighted": 0.940917, + "ap": 0.90673, + "ap_weighted": 0.90673 + }, + { + "accuracy": 0.89821, + "f1": 0.897318, + "f1_weighted": 0.897318, + "ap": 0.832765, + "ap_weighted": 0.832765 + } + ], + "main_score": 0.931718, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 130.29326963424683, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonReviewsClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonReviewsClassification.json new file mode 100644 index 0000000000..7e13a5996c --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AmazonReviewsClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "1399c76144fd37290681b995c656ef9b2e06e26d", + "task_name": "AmazonReviewsClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.53572, + "f1": 0.530963, + "f1_weighted": 0.530963, + "scores_per_experiment": [ + { + "accuracy": 0.5258, + "f1": 0.519506, + "f1_weighted": 0.519506 + }, + { + "accuracy": 0.541, + "f1": 0.538943, + "f1_weighted": 0.538943 + }, + { + "accuracy": 0.5242, + "f1": 0.525775, + "f1_weighted": 0.525775 + }, + { + "accuracy": 0.5452, + "f1": 0.538755, + "f1_weighted": 0.538755 + }, + { + "accuracy": 0.5428, + "f1": 0.527215, + "f1_weighted": 0.527215 + }, + { + "accuracy": 0.5346, + "f1": 0.53011, + "f1_weighted": 0.53011 + }, + { + "accuracy": 0.523, + "f1": 0.520411, + "f1_weighted": 0.520411 + }, + { + "accuracy": 0.5618, + "f1": 0.565189, + "f1_weighted": 0.565189 + }, + { + "accuracy": 0.5332, + "f1": 0.530218, + "f1_weighted": 0.530218 + }, + { + "accuracy": 0.5256, + "f1": 0.513505, + "f1_weighted": 0.513505 + } + ], + "main_score": 0.53572, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 25.778754234313965, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AppsRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AppsRetrieval.json new file mode 100644 index 0000000000..cb00dc21ae --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AppsRetrieval.json @@ -0,0 +1,159 @@ +{ + "dataset_revision": "f22508f96b7a36c2415181ed8bb76f76e04ae2d5", + "task_name": "AppsRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.4239, + "ndcg_at_3": 0.51332, + "ndcg_at_5": 0.53895, + "ndcg_at_10": 0.56405, + "ndcg_at_20": 0.58239, + "ndcg_at_100": 0.60614, + "ndcg_at_1000": 0.61521, + "map_at_1": 0.4239, + "map_at_3": 0.4911, + "map_at_5": 0.50535, + "map_at_10": 0.51572, + "map_at_20": 0.52076, + "map_at_100": 0.52409, + "map_at_1000": 0.52443, + "recall_at_1": 0.4239, + "recall_at_3": 0.57769, + "recall_at_5": 0.63984, + "recall_at_10": 0.7174, + "recall_at_20": 0.78991, + "recall_at_100": 0.91713, + "recall_at_1000": 0.98831, + "precision_at_1": 0.4239, + "precision_at_3": 0.19256, + "precision_at_5": 0.12797, + "precision_at_10": 0.07174, + "precision_at_20": 0.0395, + "precision_at_100": 0.00917, + "precision_at_1000": 0.00099, + "mrr_at_1": 0.423639, + "mrr_at_3": 0.490969, + "mrr_at_5": 0.505219, + "mrr_at_10": 0.515558, + "mrr_at_20": 0.520623, + "mrr_at_100": 0.523951, + "mrr_at_1000": 0.524295, + "nauc_ndcg_at_1_max": 0.468151, + "nauc_ndcg_at_1_std": -0.09494, + "nauc_ndcg_at_1_diff1": 0.671995, + "nauc_ndcg_at_3_max": 0.464065, + "nauc_ndcg_at_3_std": -0.063099, + "nauc_ndcg_at_3_diff1": 0.599892, + "nauc_ndcg_at_5_max": 0.464353, + "nauc_ndcg_at_5_std": -0.043058, + "nauc_ndcg_at_5_diff1": 0.591136, + "nauc_ndcg_at_10_max": 0.466309, + "nauc_ndcg_at_10_std": -0.03698, + "nauc_ndcg_at_10_diff1": 0.58836, + "nauc_ndcg_at_20_max": 0.468328, + "nauc_ndcg_at_20_std": -0.030916, + "nauc_ndcg_at_20_diff1": 0.589795, + "nauc_ndcg_at_100_max": 0.466759, + "nauc_ndcg_at_100_std": -0.035153, + "nauc_ndcg_at_100_diff1": 0.596007, + "nauc_ndcg_at_1000_max": 0.468178, + "nauc_ndcg_at_1000_std": -0.040804, + "nauc_ndcg_at_1000_diff1": 0.601611, + "nauc_map_at_1_max": 0.468151, + "nauc_map_at_1_std": -0.09494, + "nauc_map_at_1_diff1": 0.671995, + "nauc_map_at_3_max": 0.464884, + "nauc_map_at_3_std": -0.070945, + "nauc_map_at_3_diff1": 0.617551, + "nauc_map_at_5_max": 0.465257, + "nauc_map_at_5_std": -0.060216, + "nauc_map_at_5_diff1": 0.613187, + "nauc_map_at_10_max": 0.465998, + "nauc_map_at_10_std": -0.058255, + "nauc_map_at_10_diff1": 0.612508, + "nauc_map_at_20_max": 0.466562, + "nauc_map_at_20_std": -0.056874, + "nauc_map_at_20_diff1": 0.613176, + "nauc_map_at_100_max": 0.466333, + "nauc_map_at_100_std": -0.05755, + "nauc_map_at_100_diff1": 0.614072, + "nauc_map_at_1000_max": 0.466443, + "nauc_map_at_1000_std": -0.05763, + "nauc_map_at_1000_diff1": 0.614281, + "nauc_recall_at_1_max": 0.468151, + "nauc_recall_at_1_std": -0.09494, + "nauc_recall_at_1_diff1": 0.671995, + "nauc_recall_at_3_max": 0.461629, + "nauc_recall_at_3_std": -0.038985, + "nauc_recall_at_3_diff1": 0.545665, + "nauc_recall_at_5_max": 0.461199, + "nauc_recall_at_5_std": 0.017203, + "nauc_recall_at_5_diff1": 0.516449, + "nauc_recall_at_10_max": 0.468571, + "nauc_recall_at_10_std": 0.052804, + "nauc_recall_at_10_diff1": 0.491747, + "nauc_recall_at_20_max": 0.480613, + "nauc_recall_at_20_std": 0.112502, + "nauc_recall_at_20_diff1": 0.473881, + "nauc_recall_at_100_max": 0.470175, + "nauc_recall_at_100_std": 0.22494, + "nauc_recall_at_100_diff1": 0.433198, + "nauc_recall_at_1000_max": 0.656147, + "nauc_recall_at_1000_std": 0.615157, + "nauc_recall_at_1000_diff1": 0.436366, + "nauc_precision_at_1_max": 0.468151, + "nauc_precision_at_1_std": -0.09494, + "nauc_precision_at_1_diff1": 0.671995, + "nauc_precision_at_3_max": 0.461629, + "nauc_precision_at_3_std": -0.038985, + "nauc_precision_at_3_diff1": 0.545665, + "nauc_precision_at_5_max": 0.461199, + "nauc_precision_at_5_std": 0.017203, + "nauc_precision_at_5_diff1": 0.516449, + "nauc_precision_at_10_max": 0.468571, + "nauc_precision_at_10_std": 0.052804, + "nauc_precision_at_10_diff1": 0.491747, + "nauc_precision_at_20_max": 0.480613, + "nauc_precision_at_20_std": 0.112502, + "nauc_precision_at_20_diff1": 0.473881, + "nauc_precision_at_100_max": 0.470175, + "nauc_precision_at_100_std": 0.22494, + "nauc_precision_at_100_diff1": 0.433198, + "nauc_precision_at_1000_max": 0.656147, + "nauc_precision_at_1000_std": 0.615157, + "nauc_precision_at_1000_diff1": 0.436366, + "nauc_mrr_at_1_max": 0.468517, + "nauc_mrr_at_1_std": -0.094522, + "nauc_mrr_at_1_diff1": 0.672672, + "nauc_mrr_at_3_max": 0.465076, + "nauc_mrr_at_3_std": -0.070753, + "nauc_mrr_at_3_diff1": 0.61789, + "nauc_mrr_at_5_max": 0.465453, + "nauc_mrr_at_5_std": -0.060021, + "nauc_mrr_at_5_diff1": 0.613534, + "nauc_mrr_at_10_max": 0.466179, + "nauc_mrr_at_10_std": -0.057996, + "nauc_mrr_at_10_diff1": 0.612895, + "nauc_mrr_at_20_max": 0.466762, + "nauc_mrr_at_20_std": -0.05667, + "nauc_mrr_at_20_diff1": 0.613534, + "nauc_mrr_at_100_max": 0.466536, + "nauc_mrr_at_100_std": -0.057343, + "nauc_mrr_at_100_diff1": 0.614432, + "nauc_mrr_at_1000_max": 0.466646, + "nauc_mrr_at_1000_std": -0.057424, + "nauc_mrr_at_1000_diff1": 0.614642, + "main_score": 0.56405, + "hf_subset": "default", + "languages": [ + "eng-Latn", + "python-Code" + ] + } + ] + }, + "evaluation_time": 71.75110912322998, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArguAna.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArguAna.json new file mode 100644 index 0000000000..25ad3e6684 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArguAna.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "c22ab2a51041ffd869aaddef7af8d8215647e41a", + "task_name": "ArguAna", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.51138, + "ndcg_at_3": 0.68576, + "ndcg_at_5": 0.7216, + "ndcg_at_10": 0.74555, + "ndcg_at_20": 0.75052, + "ndcg_at_100": 0.75183, + "ndcg_at_1000": 0.75183, + "map_at_1": 0.51138, + "map_at_3": 0.64237, + "map_at_5": 0.66232, + "map_at_10": 0.67249, + "map_at_20": 0.67392, + "map_at_100": 0.67415, + "map_at_1000": 0.67415, + "recall_at_1": 0.51138, + "recall_at_3": 0.81152, + "recall_at_5": 0.89829, + "recall_at_10": 0.97084, + "recall_at_20": 0.99004, + "recall_at_100": 0.99644, + "recall_at_1000": 0.99644, + "precision_at_1": 0.51138, + "precision_at_3": 0.27051, + "precision_at_5": 0.17966, + "precision_at_10": 0.09708, + "precision_at_20": 0.0495, + "precision_at_100": 0.00996, + "precision_at_1000": 0.001, + "mrr_at_1": 0.515647, + "mrr_at_3": 0.643551, + "mrr_at_5": 0.663857, + "mrr_at_10": 0.674029, + "mrr_at_20": 0.675457, + "mrr_at_100": 0.675687, + "mrr_at_1000": 0.675687, + "nauc_ndcg_at_1_max": -0.197761, + "nauc_ndcg_at_1_std": -0.193214, + "nauc_ndcg_at_1_diff1": 0.195527, + "nauc_ndcg_at_3_max": -0.129149, + "nauc_ndcg_at_3_std": -0.16005, + "nauc_ndcg_at_3_diff1": 0.191049, + "nauc_ndcg_at_5_max": -0.139129, + "nauc_ndcg_at_5_std": -0.155538, + "nauc_ndcg_at_5_diff1": 0.181118, + "nauc_ndcg_at_10_max": -0.148019, + "nauc_ndcg_at_10_std": -0.161181, + "nauc_ndcg_at_10_diff1": 0.189468, + "nauc_ndcg_at_20_max": -0.155176, + "nauc_ndcg_at_20_std": -0.165192, + "nauc_ndcg_at_20_diff1": 0.182507, + "nauc_ndcg_at_100_max": -0.158898, + "nauc_ndcg_at_100_std": -0.168269, + "nauc_ndcg_at_100_diff1": 0.182436, + "nauc_ndcg_at_1000_max": -0.158898, + "nauc_ndcg_at_1000_std": -0.168269, + "nauc_ndcg_at_1000_diff1": 0.182436, + "nauc_map_at_1_max": -0.197761, + "nauc_map_at_1_std": -0.193214, + "nauc_map_at_1_diff1": 0.195527, + "nauc_map_at_3_max": -0.152345, + "nauc_map_at_3_std": -0.171344, + "nauc_map_at_3_diff1": 0.186395, + "nauc_map_at_5_max": -0.15909, + "nauc_map_at_5_std": -0.170677, + "nauc_map_at_5_diff1": 0.181034, + "nauc_map_at_10_max": -0.163014, + "nauc_map_at_10_std": -0.172954, + "nauc_map_at_10_diff1": 0.184073, + "nauc_map_at_20_max": -0.164529, + "nauc_map_at_20_std": -0.173941, + "nauc_map_at_20_diff1": 0.182582, + "nauc_map_at_100_max": -0.165056, + "nauc_map_at_100_std": -0.174444, + "nauc_map_at_100_diff1": 0.182565, + "nauc_map_at_1000_max": -0.165056, + "nauc_map_at_1000_std": -0.174444, + "nauc_map_at_1000_diff1": 0.182565, + "nauc_recall_at_1_max": -0.197761, + "nauc_recall_at_1_std": -0.193214, + "nauc_recall_at_1_diff1": 0.195527, + "nauc_recall_at_3_max": -0.023342, + "nauc_recall_at_3_std": -0.108488, + "nauc_recall_at_3_diff1": 0.215834, + "nauc_recall_at_5_max": 0.008046, + "nauc_recall_at_5_std": -0.03914, + "nauc_recall_at_5_diff1": 0.186061, + "nauc_recall_at_10_max": 0.198821, + "nauc_recall_at_10_std": 0.125064, + "nauc_recall_at_10_diff1": 0.356986, + "nauc_recall_at_20_max": 0.311123, + "nauc_recall_at_20_std": 0.386643, + "nauc_recall_at_20_diff1": 0.152131, + "nauc_recall_at_100_max": 0.184725, + "nauc_recall_at_100_std": 0.635385, + "nauc_recall_at_100_diff1": 0.084392, + "nauc_recall_at_1000_max": 0.184725, + "nauc_recall_at_1000_std": 0.635385, + "nauc_recall_at_1000_diff1": 0.084392, + "nauc_precision_at_1_max": -0.197761, + "nauc_precision_at_1_std": -0.193214, + "nauc_precision_at_1_diff1": 0.195527, + "nauc_precision_at_3_max": -0.023342, + "nauc_precision_at_3_std": -0.108488, + "nauc_precision_at_3_diff1": 0.215834, + "nauc_precision_at_5_max": 0.008046, + "nauc_precision_at_5_std": -0.03914, + "nauc_precision_at_5_diff1": 0.186061, + "nauc_precision_at_10_max": 0.198821, + "nauc_precision_at_10_std": 0.125064, + "nauc_precision_at_10_diff1": 0.356986, + "nauc_precision_at_20_max": 0.311123, + "nauc_precision_at_20_std": 0.386643, + "nauc_precision_at_20_diff1": 0.152131, + "nauc_precision_at_100_max": 0.184725, + "nauc_precision_at_100_std": 0.635385, + "nauc_precision_at_100_diff1": 0.084392, + "nauc_precision_at_1000_max": 0.184725, + "nauc_precision_at_1000_std": 0.635385, + "nauc_precision_at_1000_diff1": 0.084392, + "nauc_mrr_at_1_max": -0.197348, + "nauc_mrr_at_1_std": -0.184673, + "nauc_mrr_at_1_diff1": 0.184015, + "nauc_mrr_at_3_max": -0.1585, + "nauc_mrr_at_3_std": -0.169397, + "nauc_mrr_at_3_diff1": 0.171302, + "nauc_mrr_at_5_max": -0.163461, + "nauc_mrr_at_5_std": -0.166808, + "nauc_mrr_at_5_diff1": 0.167117, + "nauc_mrr_at_10_max": -0.16757, + "nauc_mrr_at_10_std": -0.16893, + "nauc_mrr_at_10_diff1": 0.16959, + "nauc_mrr_at_20_max": -0.169114, + "nauc_mrr_at_20_std": -0.169895, + "nauc_mrr_at_20_diff1": 0.168013, + "nauc_mrr_at_100_max": -0.169646, + "nauc_mrr_at_100_std": -0.170395, + "nauc_mrr_at_100_diff1": 0.167983, + "nauc_mrr_at_1000_max": -0.169646, + "nauc_mrr_at_1000_std": -0.170395, + "nauc_mrr_at_1000_diff1": 0.167983, + "main_score": 0.74555, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 11.137962579727173, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArxivClusteringP2P.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArxivClusteringP2P.json new file mode 100644 index 0000000000..3fbfa4b1f7 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArxivClusteringP2P.json @@ -0,0 +1,53 @@ +{ + "dataset_revision": "a122ad7f3f0291bf49cc6f4d32aa80929df69d5d", + "task_name": "ArxivClusteringP2P", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.484904, + "v_measure_std": 0.139002, + "v_measures": [ + 0.501068, + 0.50512, + 0.498116, + 0.486214, + 0.499504, + 0.463445, + 0.459985, + 0.485717, + 0.48679, + 0.483597, + 0.566444, + 0.569411, + 0.565953, + 0.562226, + 0.570999, + 0.569159, + 0.558643, + 0.566468, + 0.56469, + 0.567975, + 0.535372, + 0.28786, + 0.471878, + 0.417082, + 0.360013, + 0.278333, + 0.302666, + 0.233841, + 0.330557, + 1.0, + 0.282884 + ], + "main_score": 0.484904, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 128.57761693000793, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArxivClusteringS2S.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArxivClusteringS2S.json new file mode 100644 index 0000000000..191b06cd0b --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ArxivClusteringS2S.json @@ -0,0 +1,53 @@ +{ + "dataset_revision": "f910caf1a6075f7329cdf8c1a6135696f37dbd53", + "task_name": "ArxivClusteringS2S", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.428325, + "v_measure_std": 0.142066, + "v_measures": [ + 0.429042, + 0.451686, + 0.444571, + 0.431784, + 0.423388, + 0.446913, + 0.426681, + 0.440458, + 0.439653, + 0.432534, + 0.491187, + 0.502175, + 0.500589, + 0.501042, + 0.500935, + 0.498296, + 0.498302, + 0.494469, + 0.498679, + 0.497697, + 0.463844, + 0.229918, + 0.359698, + 0.371051, + 0.312968, + 0.223137, + 0.260583, + 0.190319, + 0.286372, + 1.0, + 0.230109 + ], + "main_score": 0.428325, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 60.15584969520569, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AskUbuntuDupQuestions.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AskUbuntuDupQuestions.json new file mode 100644 index 0000000000..58b9825870 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/AskUbuntuDupQuestions.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "2000358ca161889fa9c082cb41daa8dcfb161a54", + "task_name": "AskUbuntuDupQuestions", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "map": 0.63343, + "mrr": 0.765471, + "nAUC_map_max": 0.201553, + "nAUC_map_std": 0.149848, + "nAUC_map_diff1": 0.122445, + "nAUC_mrr_max": 0.30655, + "nAUC_mrr_std": 0.179701, + "nAUC_mrr_diff1": 0.191408, + "main_score": 0.63343, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.4938678741455078, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BIOSSES.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BIOSSES.json new file mode 100644 index 0000000000..3a43e29684 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BIOSSES.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "d3fb88f8f02e40887cd149695127462bbcf29b4a", + "task_name": "BIOSSES", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.862969, + "spearman": 0.84776, + "cosine_pearson": 0.862969, + "cosine_spearman": 0.84776, + "manhattan_pearson": 0.837777, + "manhattan_spearman": 0.845284, + "euclidean_pearson": 0.835384, + "euclidean_spearman": 0.842369, + "main_score": 0.84776, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.10980749130249023, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/Banking77Classification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/Banking77Classification.json new file mode 100644 index 0000000000..3ef5f2aa02 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/Banking77Classification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "0fd18e25b25c072e09e0d92ab615fda904d66300", + "task_name": "Banking77Classification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.862273, + "f1": 0.861745, + "f1_weighted": 0.861745, + "scores_per_experiment": [ + { + "accuracy": 0.87013, + "f1": 0.86953, + "f1_weighted": 0.86953 + }, + { + "accuracy": 0.864286, + "f1": 0.863738, + "f1_weighted": 0.863738 + }, + { + "accuracy": 0.867208, + "f1": 0.866305, + "f1_weighted": 0.866305 + }, + { + "accuracy": 0.869156, + "f1": 0.869719, + "f1_weighted": 0.869719 + }, + { + "accuracy": 0.866558, + "f1": 0.866739, + "f1_weighted": 0.866739 + }, + { + "accuracy": 0.84513, + "f1": 0.844087, + "f1_weighted": 0.844087 + }, + { + "accuracy": 0.855844, + "f1": 0.855254, + "f1_weighted": 0.855254 + }, + { + "accuracy": 0.850974, + "f1": 0.849352, + "f1_weighted": 0.849352 + }, + { + "accuracy": 0.865584, + "f1": 0.865026, + "f1_weighted": 0.865026 + }, + { + "accuracy": 0.867857, + "f1": 0.8677, + "f1_weighted": 0.8677 + } + ], + "main_score": 0.862273, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 18.690781354904175, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BiorxivClusteringP2P.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..7d3c041d51 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "task_name": "BiorxivClusteringP2P", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.389099, + "v_measure_std": 0.008446, + "v_measures": [ + 0.384816, + 0.385433, + 0.402986, + 0.382425, + 0.3841, + 0.391366, + 0.376855, + 0.40203, + 0.397307, + 0.383669 + ], + "main_score": 0.389099, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 21.839644193649292, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BiorxivClusteringS2S.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..8feb26b8e1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "task_name": "BiorxivClusteringS2S", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.367982, + "v_measure_std": 0.009708, + "v_measures": [ + 0.369257, + 0.37878, + 0.373136, + 0.357176, + 0.354509, + 0.378606, + 0.354997, + 0.38171, + 0.362662, + 0.368989 + ], + "main_score": 0.367982, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 7.569418907165527, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/COIRCodeSearchNetRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/COIRCodeSearchNetRetrieval.json new file mode 100644 index 0000000000..8c110162bd --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/COIRCodeSearchNetRetrieval.json @@ -0,0 +1,893 @@ +{ + "dataset_revision": "4adc7bc41202b5c13543c9c886a25f340634dab3", + "task_name": "COIRCodeSearchNetRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.80875, + "ndcg_at_3": 0.86448, + "ndcg_at_5": 0.87443, + "ndcg_at_10": 0.88172, + "ndcg_at_20": 0.88558, + "ndcg_at_100": 0.88944, + "ndcg_at_1000": 0.89078, + "map_at_1": 0.80875, + "map_at_3": 0.85139, + "map_at_5": 0.85694, + "map_at_10": 0.86001, + "map_at_20": 0.86107, + "map_at_100": 0.86163, + "map_at_1000": 0.86167, + "recall_at_1": 0.80875, + "recall_at_3": 0.90213, + "recall_at_5": 0.92613, + "recall_at_10": 0.94838, + "recall_at_20": 0.9636, + "recall_at_100": 0.98411, + "recall_at_1000": 0.99484, + "precision_at_1": 0.80875, + "precision_at_3": 0.30071, + "precision_at_5": 0.18523, + "precision_at_10": 0.09484, + "precision_at_20": 0.04818, + "precision_at_100": 0.00984, + "precision_at_1000": 0.00099, + "mrr_at_1": 0.808755, + "mrr_at_3": 0.851388, + "mrr_at_5": 0.856941, + "mrr_at_10": 0.860012, + "mrr_at_20": 0.861074, + "mrr_at_100": 0.861626, + "mrr_at_1000": 0.861673, + "nauc_ndcg_at_1_max": 0.682081, + "nauc_ndcg_at_1_std": -0.102206, + "nauc_ndcg_at_1_diff1": 0.842817, + "nauc_ndcg_at_3_max": 0.728937, + "nauc_ndcg_at_3_std": -0.056468, + "nauc_ndcg_at_3_diff1": 0.81739, + "nauc_ndcg_at_5_max": 0.730947, + "nauc_ndcg_at_5_std": -0.051439, + "nauc_ndcg_at_5_diff1": 0.820668, + "nauc_ndcg_at_10_max": 0.730143, + "nauc_ndcg_at_10_std": -0.042501, + "nauc_ndcg_at_10_diff1": 0.822962, + "nauc_ndcg_at_20_max": 0.729294, + "nauc_ndcg_at_20_std": -0.043713, + "nauc_ndcg_at_20_diff1": 0.823548, + "nauc_ndcg_at_100_max": 0.725423, + "nauc_ndcg_at_100_std": -0.046948, + "nauc_ndcg_at_100_diff1": 0.825062, + "nauc_ndcg_at_1000_max": 0.723429, + "nauc_ndcg_at_1000_std": -0.051922, + "nauc_ndcg_at_1000_diff1": 0.82522, + "nauc_map_at_1_max": 0.682081, + "nauc_map_at_1_std": -0.102206, + "nauc_map_at_1_diff1": 0.842817, + "nauc_map_at_3_max": 0.716312, + "nauc_map_at_3_std": -0.069952, + "nauc_map_at_3_diff1": 0.824764, + "nauc_map_at_5_max": 0.71686, + "nauc_map_at_5_std": -0.068027, + "nauc_map_at_5_diff1": 0.826639, + "nauc_map_at_10_max": 0.716306, + "nauc_map_at_10_std": -0.065019, + "nauc_map_at_10_diff1": 0.82756, + "nauc_map_at_20_max": 0.71599, + "nauc_map_at_20_std": -0.065516, + "nauc_map_at_20_diff1": 0.827729, + "nauc_map_at_100_max": 0.715491, + "nauc_map_at_100_std": -0.065993, + "nauc_map_at_100_diff1": 0.827929, + "nauc_map_at_1000_max": 0.715432, + "nauc_map_at_1000_std": -0.066118, + "nauc_map_at_1000_diff1": 0.827936, + "nauc_recall_at_1_max": 0.682081, + "nauc_recall_at_1_std": -0.102206, + "nauc_recall_at_1_diff1": 0.842817, + "nauc_recall_at_3_max": 0.780886, + "nauc_recall_at_3_std": -0.000201, + "nauc_recall_at_3_diff1": 0.78669, + "nauc_recall_at_5_max": 0.80516, + "nauc_recall_at_5_std": 0.038001, + "nauc_recall_at_5_diff1": 0.789997, + "nauc_recall_at_10_max": 0.831013, + "nauc_recall_at_10_std": 0.133861, + "nauc_recall_at_10_diff1": 0.792651, + "nauc_recall_at_20_max": 0.863403, + "nauc_recall_at_20_std": 0.194104, + "nauc_recall_at_20_diff1": 0.786999, + "nauc_recall_at_100_max": 0.899147, + "nauc_recall_at_100_std": 0.387695, + "nauc_recall_at_100_diff1": 0.791989, + "nauc_recall_at_1000_max": 0.937914, + "nauc_recall_at_1000_std": 0.456533, + "nauc_recall_at_1000_diff1": 0.744587, + "nauc_precision_at_1_max": 0.682081, + "nauc_precision_at_1_std": -0.102206, + "nauc_precision_at_1_diff1": 0.842817, + "nauc_precision_at_3_max": 0.780886, + "nauc_precision_at_3_std": -0.000201, + "nauc_precision_at_3_diff1": 0.78669, + "nauc_precision_at_5_max": 0.80516, + "nauc_precision_at_5_std": 0.038001, + "nauc_precision_at_5_diff1": 0.789997, + "nauc_precision_at_10_max": 0.831013, + "nauc_precision_at_10_std": 0.133861, + "nauc_precision_at_10_diff1": 0.792651, + "nauc_precision_at_20_max": 0.863403, + "nauc_precision_at_20_std": 0.194104, + "nauc_precision_at_20_diff1": 0.786999, + "nauc_precision_at_100_max": 0.899147, + "nauc_precision_at_100_std": 0.387695, + "nauc_precision_at_100_diff1": 0.791989, + "nauc_precision_at_1000_max": 0.937914, + "nauc_precision_at_1000_std": 0.456533, + "nauc_precision_at_1000_diff1": 0.744587, + "nauc_mrr_at_1_max": 0.682081, + "nauc_mrr_at_1_std": -0.102206, + "nauc_mrr_at_1_diff1": 0.842817, + "nauc_mrr_at_3_max": 0.716312, + "nauc_mrr_at_3_std": -0.069952, + "nauc_mrr_at_3_diff1": 0.824764, + "nauc_mrr_at_5_max": 0.71686, + "nauc_mrr_at_5_std": -0.068027, + "nauc_mrr_at_5_diff1": 0.826639, + "nauc_mrr_at_10_max": 0.716306, + "nauc_mrr_at_10_std": -0.065019, + "nauc_mrr_at_10_diff1": 0.82756, + "nauc_mrr_at_20_max": 0.71599, + "nauc_mrr_at_20_std": -0.065516, + "nauc_mrr_at_20_diff1": 0.827729, + "nauc_mrr_at_100_max": 0.715491, + "nauc_mrr_at_100_std": -0.065993, + "nauc_mrr_at_100_diff1": 0.827929, + "nauc_mrr_at_1000_max": 0.715432, + "nauc_mrr_at_1000_std": -0.066118, + "nauc_mrr_at_1000_diff1": 0.827936, + "main_score": 0.88172, + "hf_subset": "python", + "languages": [ + "python-Code" + ] + }, + { + "ndcg_at_1": 0.66545, + "ndcg_at_3": 0.73782, + "ndcg_at_5": 0.74916, + "ndcg_at_10": 0.76034, + "ndcg_at_20": 0.76683, + "ndcg_at_100": 0.77661, + "ndcg_at_1000": 0.78162, + "map_at_1": 0.66545, + "map_at_3": 0.72045, + "map_at_5": 0.72679, + "map_at_10": 0.73145, + "map_at_20": 0.73325, + "map_at_100": 0.73466, + "map_at_1000": 0.73484, + "recall_at_1": 0.66545, + "recall_at_3": 0.78791, + "recall_at_5": 0.81525, + "recall_at_10": 0.84959, + "recall_at_20": 0.87511, + "recall_at_100": 0.92707, + "recall_at_1000": 0.96718, + "precision_at_1": 0.66545, + "precision_at_3": 0.26264, + "precision_at_5": 0.16305, + "precision_at_10": 0.08496, + "precision_at_20": 0.04376, + "precision_at_100": 0.00927, + "precision_at_1000": 0.00097, + "mrr_at_1": 0.665451, + "mrr_at_3": 0.72045, + "mrr_at_5": 0.726785, + "mrr_at_10": 0.731453, + "mrr_at_20": 0.733252, + "mrr_at_100": 0.734662, + "mrr_at_1000": 0.734837, + "nauc_ndcg_at_1_max": 0.686747, + "nauc_ndcg_at_1_std": 0.008874, + "nauc_ndcg_at_1_diff1": 0.818034, + "nauc_ndcg_at_3_max": 0.741776, + "nauc_ndcg_at_3_std": 0.055559, + "nauc_ndcg_at_3_diff1": 0.784154, + "nauc_ndcg_at_5_max": 0.744999, + "nauc_ndcg_at_5_std": 0.069102, + "nauc_ndcg_at_5_diff1": 0.781723, + "nauc_ndcg_at_10_max": 0.743785, + "nauc_ndcg_at_10_std": 0.073099, + "nauc_ndcg_at_10_diff1": 0.780335, + "nauc_ndcg_at_20_max": 0.742414, + "nauc_ndcg_at_20_std": 0.076319, + "nauc_ndcg_at_20_diff1": 0.781692, + "nauc_ndcg_at_100_max": 0.73824, + "nauc_ndcg_at_100_std": 0.076121, + "nauc_ndcg_at_100_diff1": 0.781986, + "nauc_ndcg_at_1000_max": 0.736286, + "nauc_ndcg_at_1000_std": 0.070558, + "nauc_ndcg_at_1000_diff1": 0.784239, + "nauc_map_at_1_max": 0.686747, + "nauc_map_at_1_std": 0.008874, + "nauc_map_at_1_diff1": 0.818034, + "nauc_map_at_3_max": 0.728079, + "nauc_map_at_3_std": 0.043878, + "nauc_map_at_3_diff1": 0.793165, + "nauc_map_at_5_max": 0.729354, + "nauc_map_at_5_std": 0.050454, + "nauc_map_at_5_diff1": 0.792034, + "nauc_map_at_10_max": 0.728762, + "nauc_map_at_10_std": 0.051835, + "nauc_map_at_10_diff1": 0.791758, + "nauc_map_at_20_max": 0.728398, + "nauc_map_at_20_std": 0.05246, + "nauc_map_at_20_diff1": 0.792214, + "nauc_map_at_100_max": 0.727717, + "nauc_map_at_100_std": 0.05223, + "nauc_map_at_100_diff1": 0.792222, + "nauc_map_at_1000_max": 0.727645, + "nauc_map_at_1000_std": 0.052067, + "nauc_map_at_1000_diff1": 0.792284, + "nauc_recall_at_1_max": 0.686747, + "nauc_recall_at_1_std": 0.008874, + "nauc_recall_at_1_diff1": 0.818034, + "nauc_recall_at_3_max": 0.789742, + "nauc_recall_at_3_std": 0.096502, + "nauc_recall_at_3_diff1": 0.752265, + "nauc_recall_at_5_max": 0.806328, + "nauc_recall_at_5_std": 0.144502, + "nauc_recall_at_5_diff1": 0.741101, + "nauc_recall_at_10_max": 0.812386, + "nauc_recall_at_10_std": 0.176504, + "nauc_recall_at_10_diff1": 0.725836, + "nauc_recall_at_20_max": 0.814765, + "nauc_recall_at_20_std": 0.217165, + "nauc_recall_at_20_diff1": 0.72433, + "nauc_recall_at_100_max": 0.807578, + "nauc_recall_at_100_std": 0.311424, + "nauc_recall_at_100_diff1": 0.694565, + "nauc_recall_at_1000_max": 0.804249, + "nauc_recall_at_1000_std": 0.331413, + "nauc_recall_at_1000_diff1": 0.697192, + "nauc_precision_at_1_max": 0.686747, + "nauc_precision_at_1_std": 0.008874, + "nauc_precision_at_1_diff1": 0.818034, + "nauc_precision_at_3_max": 0.789742, + "nauc_precision_at_3_std": 0.096502, + "nauc_precision_at_3_diff1": 0.752265, + "nauc_precision_at_5_max": 0.806328, + "nauc_precision_at_5_std": 0.144502, + "nauc_precision_at_5_diff1": 0.741101, + "nauc_precision_at_10_max": 0.812386, + "nauc_precision_at_10_std": 0.176504, + "nauc_precision_at_10_diff1": 0.725836, + "nauc_precision_at_20_max": 0.814765, + "nauc_precision_at_20_std": 0.217165, + "nauc_precision_at_20_diff1": 0.72433, + "nauc_precision_at_100_max": 0.807578, + "nauc_precision_at_100_std": 0.311424, + "nauc_precision_at_100_diff1": 0.694565, + "nauc_precision_at_1000_max": 0.804249, + "nauc_precision_at_1000_std": 0.331413, + "nauc_precision_at_1000_diff1": 0.697192, + "nauc_mrr_at_1_max": 0.686747, + "nauc_mrr_at_1_std": 0.008874, + "nauc_mrr_at_1_diff1": 0.818034, + "nauc_mrr_at_3_max": 0.728079, + "nauc_mrr_at_3_std": 0.043878, + "nauc_mrr_at_3_diff1": 0.793165, + "nauc_mrr_at_5_max": 0.729354, + "nauc_mrr_at_5_std": 0.050454, + "nauc_mrr_at_5_diff1": 0.792034, + "nauc_mrr_at_10_max": 0.728762, + "nauc_mrr_at_10_std": 0.051835, + "nauc_mrr_at_10_diff1": 0.791758, + "nauc_mrr_at_20_max": 0.728398, + "nauc_mrr_at_20_std": 0.05246, + "nauc_mrr_at_20_diff1": 0.792214, + "nauc_mrr_at_100_max": 0.727717, + "nauc_mrr_at_100_std": 0.05223, + "nauc_mrr_at_100_diff1": 0.792222, + "nauc_mrr_at_1000_max": 0.727645, + "nauc_mrr_at_1000_std": 0.052067, + "nauc_mrr_at_1000_diff1": 0.792284, + "main_score": 0.76034, + "hf_subset": "javascript", + "languages": [ + "javascript-Code" + ] + }, + { + "ndcg_at_1": 0.81051, + "ndcg_at_3": 0.86588, + "ndcg_at_5": 0.87667, + "ndcg_at_10": 0.88316, + "ndcg_at_20": 0.88761, + "ndcg_at_100": 0.89131, + "ndcg_at_1000": 0.89257, + "map_at_1": 0.81051, + "map_at_3": 0.85285, + "map_at_5": 0.85886, + "map_at_10": 0.86156, + "map_at_20": 0.8628, + "map_at_100": 0.86333, + "map_at_1000": 0.86338, + "recall_at_1": 0.81051, + "recall_at_3": 0.90335, + "recall_at_5": 0.92945, + "recall_at_10": 0.9494, + "recall_at_20": 0.96688, + "recall_at_100": 0.98646, + "recall_at_1000": 0.99618, + "precision_at_1": 0.81051, + "precision_at_3": 0.30112, + "precision_at_5": 0.18589, + "precision_at_10": 0.09494, + "precision_at_20": 0.04834, + "precision_at_100": 0.00986, + "precision_at_1000": 0.001, + "mrr_at_1": 0.810515, + "mrr_at_3": 0.852848, + "mrr_at_5": 0.858857, + "mrr_at_10": 0.861564, + "mrr_at_20": 0.862796, + "mrr_at_100": 0.863331, + "mrr_at_1000": 0.863382, + "nauc_ndcg_at_1_max": 0.598834, + "nauc_ndcg_at_1_std": -0.447766, + "nauc_ndcg_at_1_diff1": 0.87385, + "nauc_ndcg_at_3_max": 0.638229, + "nauc_ndcg_at_3_std": -0.478464, + "nauc_ndcg_at_3_diff1": 0.847976, + "nauc_ndcg_at_5_max": 0.642855, + "nauc_ndcg_at_5_std": -0.474171, + "nauc_ndcg_at_5_diff1": 0.850908, + "nauc_ndcg_at_10_max": 0.646052, + "nauc_ndcg_at_10_std": -0.458513, + "nauc_ndcg_at_10_diff1": 0.853019, + "nauc_ndcg_at_20_max": 0.645782, + "nauc_ndcg_at_20_std": -0.456078, + "nauc_ndcg_at_20_diff1": 0.854936, + "nauc_ndcg_at_100_max": 0.640743, + "nauc_ndcg_at_100_std": -0.448549, + "nauc_ndcg_at_100_diff1": 0.855502, + "nauc_ndcg_at_1000_max": 0.637933, + "nauc_ndcg_at_1000_std": -0.453825, + "nauc_ndcg_at_1000_diff1": 0.855747, + "nauc_map_at_1_max": 0.598834, + "nauc_map_at_1_std": -0.447766, + "nauc_map_at_1_diff1": 0.87385, + "nauc_map_at_3_max": 0.627529, + "nauc_map_at_3_std": -0.470975, + "nauc_map_at_3_diff1": 0.855477, + "nauc_map_at_5_max": 0.629334, + "nauc_map_at_5_std": -0.468663, + "nauc_map_at_5_diff1": 0.857288, + "nauc_map_at_10_max": 0.630316, + "nauc_map_at_10_std": -0.463083, + "nauc_map_at_10_diff1": 0.858146, + "nauc_map_at_20_max": 0.630139, + "nauc_map_at_20_std": -0.462541, + "nauc_map_at_20_diff1": 0.858622, + "nauc_map_at_100_max": 0.629519, + "nauc_map_at_100_std": -0.461783, + "nauc_map_at_100_diff1": 0.858677, + "nauc_map_at_1000_max": 0.629434, + "nauc_map_at_1000_std": -0.461908, + "nauc_map_at_1000_diff1": 0.858685, + "nauc_recall_at_1_max": 0.598834, + "nauc_recall_at_1_std": -0.447766, + "nauc_recall_at_1_diff1": 0.87385, + "nauc_recall_at_3_max": 0.682446, + "nauc_recall_at_3_std": -0.508841, + "nauc_recall_at_3_diff1": 0.816658, + "nauc_recall_at_5_max": 0.71751, + "nauc_recall_at_5_std": -0.501612, + "nauc_recall_at_5_diff1": 0.816688, + "nauc_recall_at_10_max": 0.766946, + "nauc_recall_at_10_std": -0.404915, + "nauc_recall_at_10_diff1": 0.817849, + "nauc_recall_at_20_max": 0.826597, + "nauc_recall_at_20_std": -0.346109, + "nauc_recall_at_20_diff1": 0.824082, + "nauc_recall_at_100_max": 0.87944, + "nauc_recall_at_100_std": 0.127732, + "nauc_recall_at_100_diff1": 0.806379, + "nauc_recall_at_1000_max": 0.889703, + "nauc_recall_at_1000_std": 0.414781, + "nauc_recall_at_1000_diff1": 0.734081, + "nauc_precision_at_1_max": 0.598834, + "nauc_precision_at_1_std": -0.447766, + "nauc_precision_at_1_diff1": 0.87385, + "nauc_precision_at_3_max": 0.682446, + "nauc_precision_at_3_std": -0.508841, + "nauc_precision_at_3_diff1": 0.816658, + "nauc_precision_at_5_max": 0.71751, + "nauc_precision_at_5_std": -0.501612, + "nauc_precision_at_5_diff1": 0.816688, + "nauc_precision_at_10_max": 0.766946, + "nauc_precision_at_10_std": -0.404915, + "nauc_precision_at_10_diff1": 0.817849, + "nauc_precision_at_20_max": 0.826597, + "nauc_precision_at_20_std": -0.346109, + "nauc_precision_at_20_diff1": 0.824082, + "nauc_precision_at_100_max": 0.87944, + "nauc_precision_at_100_std": 0.127732, + "nauc_precision_at_100_diff1": 0.806379, + "nauc_precision_at_1000_max": 0.889703, + "nauc_precision_at_1000_std": 0.414781, + "nauc_precision_at_1000_diff1": 0.734081, + "nauc_mrr_at_1_max": 0.598834, + "nauc_mrr_at_1_std": -0.447766, + "nauc_mrr_at_1_diff1": 0.87385, + "nauc_mrr_at_3_max": 0.627529, + "nauc_mrr_at_3_std": -0.470975, + "nauc_mrr_at_3_diff1": 0.855477, + "nauc_mrr_at_5_max": 0.629334, + "nauc_mrr_at_5_std": -0.468663, + "nauc_mrr_at_5_diff1": 0.857288, + "nauc_mrr_at_10_max": 0.630316, + "nauc_mrr_at_10_std": -0.463083, + "nauc_mrr_at_10_diff1": 0.858146, + "nauc_mrr_at_20_max": 0.630139, + "nauc_mrr_at_20_std": -0.462541, + "nauc_mrr_at_20_diff1": 0.858622, + "nauc_mrr_at_100_max": 0.629519, + "nauc_mrr_at_100_std": -0.461783, + "nauc_mrr_at_100_diff1": 0.858677, + "nauc_mrr_at_1000_max": 0.629434, + "nauc_mrr_at_1000_std": -0.461908, + "nauc_mrr_at_1000_diff1": 0.858685, + "main_score": 0.88316, + "hf_subset": "go", + "languages": [ + "go-Code" + ] + }, + { + "ndcg_at_1": 0.6701, + "ndcg_at_3": 0.75089, + "ndcg_at_5": 0.76443, + "ndcg_at_10": 0.77677, + "ndcg_at_20": 0.78425, + "ndcg_at_100": 0.79204, + "ndcg_at_1000": 0.79566, + "map_at_1": 0.6701, + "map_at_3": 0.73183, + "map_at_5": 0.73924, + "map_at_10": 0.74435, + "map_at_20": 0.74643, + "map_at_100": 0.7475, + "map_at_1000": 0.74762, + "recall_at_1": 0.6701, + "recall_at_3": 0.80571, + "recall_at_5": 0.83902, + "recall_at_10": 0.87708, + "recall_at_20": 0.90642, + "recall_at_100": 0.94845, + "recall_at_1000": 0.9778, + "precision_at_1": 0.6701, + "precision_at_3": 0.26857, + "precision_at_5": 0.1678, + "precision_at_10": 0.08771, + "precision_at_20": 0.04532, + "precision_at_100": 0.00948, + "precision_at_1000": 0.00098, + "mrr_at_1": 0.670103, + "mrr_at_3": 0.731827, + "mrr_at_5": 0.739241, + "mrr_at_10": 0.744351, + "mrr_at_20": 0.746429, + "mrr_at_100": 0.747502, + "mrr_at_1000": 0.74762, + "nauc_ndcg_at_1_max": 0.68131, + "nauc_ndcg_at_1_std": -0.0532, + "nauc_ndcg_at_1_diff1": 0.732457, + "nauc_ndcg_at_3_max": 0.710688, + "nauc_ndcg_at_3_std": -0.002522, + "nauc_ndcg_at_3_diff1": 0.695234, + "nauc_ndcg_at_5_max": 0.70899, + "nauc_ndcg_at_5_std": 0.009805, + "nauc_ndcg_at_5_diff1": 0.691851, + "nauc_ndcg_at_10_max": 0.707782, + "nauc_ndcg_at_10_std": 0.017979, + "nauc_ndcg_at_10_diff1": 0.690853, + "nauc_ndcg_at_20_max": 0.704298, + "nauc_ndcg_at_20_std": 0.016453, + "nauc_ndcg_at_20_diff1": 0.690411, + "nauc_ndcg_at_100_max": 0.70265, + "nauc_ndcg_at_100_std": 0.019071, + "nauc_ndcg_at_100_diff1": 0.692558, + "nauc_ndcg_at_1000_max": 0.702446, + "nauc_ndcg_at_1000_std": 0.013112, + "nauc_ndcg_at_1000_diff1": 0.693983, + "nauc_map_at_1_max": 0.68131, + "nauc_map_at_1_std": -0.0532, + "nauc_map_at_1_diff1": 0.732457, + "nauc_map_at_3_max": 0.702763, + "nauc_map_at_3_std": -0.015795, + "nauc_map_at_3_diff1": 0.704926, + "nauc_map_at_5_max": 0.701594, + "nauc_map_at_5_std": -0.0104, + "nauc_map_at_5_diff1": 0.703395, + "nauc_map_at_10_max": 0.700988, + "nauc_map_at_10_std": -0.00788, + "nauc_map_at_10_diff1": 0.703371, + "nauc_map_at_20_max": 0.700109, + "nauc_map_at_20_std": -0.008558, + "nauc_map_at_20_diff1": 0.703417, + "nauc_map_at_100_max": 0.700012, + "nauc_map_at_100_std": -0.008048, + "nauc_map_at_100_diff1": 0.703709, + "nauc_map_at_1000_max": 0.699981, + "nauc_map_at_1000_std": -0.008208, + "nauc_map_at_1000_diff1": 0.70373, + "nauc_recall_at_1_max": 0.68131, + "nauc_recall_at_1_std": -0.0532, + "nauc_recall_at_1_diff1": 0.732457, + "nauc_recall_at_3_max": 0.739782, + "nauc_recall_at_3_std": 0.045979, + "nauc_recall_at_3_diff1": 0.659851, + "nauc_recall_at_5_max": 0.740154, + "nauc_recall_at_5_std": 0.099034, + "nauc_recall_at_5_diff1": 0.642485, + "nauc_recall_at_10_max": 0.742775, + "nauc_recall_at_10_std": 0.165964, + "nauc_recall_at_10_diff1": 0.622749, + "nauc_recall_at_20_max": 0.72455, + "nauc_recall_at_20_std": 0.19708, + "nauc_recall_at_20_diff1": 0.599214, + "nauc_recall_at_100_max": 0.704559, + "nauc_recall_at_100_std": 0.375339, + "nauc_recall_at_100_diff1": 0.568819, + "nauc_recall_at_1000_max": 0.707216, + "nauc_recall_at_1000_std": 0.450448, + "nauc_recall_at_1000_diff1": 0.513956, + "nauc_precision_at_1_max": 0.68131, + "nauc_precision_at_1_std": -0.0532, + "nauc_precision_at_1_diff1": 0.732457, + "nauc_precision_at_3_max": 0.739782, + "nauc_precision_at_3_std": 0.045979, + "nauc_precision_at_3_diff1": 0.659851, + "nauc_precision_at_5_max": 0.740154, + "nauc_precision_at_5_std": 0.099034, + "nauc_precision_at_5_diff1": 0.642485, + "nauc_precision_at_10_max": 0.742775, + "nauc_precision_at_10_std": 0.165964, + "nauc_precision_at_10_diff1": 0.622749, + "nauc_precision_at_20_max": 0.72455, + "nauc_precision_at_20_std": 0.19708, + "nauc_precision_at_20_diff1": 0.599214, + "nauc_precision_at_100_max": 0.704559, + "nauc_precision_at_100_std": 0.375339, + "nauc_precision_at_100_diff1": 0.568819, + "nauc_precision_at_1000_max": 0.707216, + "nauc_precision_at_1000_std": 0.450448, + "nauc_precision_at_1000_diff1": 0.513956, + "nauc_mrr_at_1_max": 0.68131, + "nauc_mrr_at_1_std": -0.0532, + "nauc_mrr_at_1_diff1": 0.732457, + "nauc_mrr_at_3_max": 0.702763, + "nauc_mrr_at_3_std": -0.015795, + "nauc_mrr_at_3_diff1": 0.704926, + "nauc_mrr_at_5_max": 0.701594, + "nauc_mrr_at_5_std": -0.0104, + "nauc_mrr_at_5_diff1": 0.703395, + "nauc_mrr_at_10_max": 0.700988, + "nauc_mrr_at_10_std": -0.00788, + "nauc_mrr_at_10_diff1": 0.703371, + "nauc_mrr_at_20_max": 0.700109, + "nauc_mrr_at_20_std": -0.008558, + "nauc_mrr_at_20_diff1": 0.703417, + "nauc_mrr_at_100_max": 0.700012, + "nauc_mrr_at_100_std": -0.008048, + "nauc_mrr_at_100_diff1": 0.703709, + "nauc_mrr_at_1000_max": 0.699981, + "nauc_mrr_at_1000_std": -0.008208, + "nauc_mrr_at_1000_diff1": 0.70373, + "main_score": 0.77677, + "hf_subset": "ruby", + "languages": [ + "ruby-Code" + ] + }, + { + "ndcg_at_1": 0.75098, + "ndcg_at_3": 0.81415, + "ndcg_at_5": 0.82465, + "ndcg_at_10": 0.83266, + "ndcg_at_20": 0.83753, + "ndcg_at_100": 0.843, + "ndcg_at_1000": 0.84591, + "map_at_1": 0.75098, + "map_at_3": 0.79935, + "map_at_5": 0.80518, + "map_at_10": 0.8085, + "map_at_20": 0.80984, + "map_at_100": 0.81061, + "map_at_1000": 0.81072, + "recall_at_1": 0.75098, + "recall_at_3": 0.85669, + "recall_at_5": 0.88215, + "recall_at_10": 0.90689, + "recall_at_20": 0.92606, + "recall_at_100": 0.95536, + "recall_at_1000": 0.97864, + "precision_at_1": 0.75098, + "precision_at_3": 0.28556, + "precision_at_5": 0.17643, + "precision_at_10": 0.09069, + "precision_at_20": 0.0463, + "precision_at_100": 0.00955, + "precision_at_1000": 0.00098, + "mrr_at_1": 0.750981, + "mrr_at_3": 0.799346, + "mrr_at_5": 0.805183, + "mrr_at_10": 0.808496, + "mrr_at_20": 0.809843, + "mrr_at_100": 0.810612, + "mrr_at_1000": 0.810716, + "nauc_ndcg_at_1_max": 0.686822, + "nauc_ndcg_at_1_std": -0.1433, + "nauc_ndcg_at_1_diff1": 0.835391, + "nauc_ndcg_at_3_max": 0.743447, + "nauc_ndcg_at_3_std": -0.106865, + "nauc_ndcg_at_3_diff1": 0.806924, + "nauc_ndcg_at_5_max": 0.74233, + "nauc_ndcg_at_5_std": -0.092893, + "nauc_ndcg_at_5_diff1": 0.803505, + "nauc_ndcg_at_10_max": 0.73917, + "nauc_ndcg_at_10_std": -0.081314, + "nauc_ndcg_at_10_diff1": 0.801846, + "nauc_ndcg_at_20_max": 0.738259, + "nauc_ndcg_at_20_std": -0.074164, + "nauc_ndcg_at_20_diff1": 0.803183, + "nauc_ndcg_at_100_max": 0.736004, + "nauc_ndcg_at_100_std": -0.074771, + "nauc_ndcg_at_100_diff1": 0.805275, + "nauc_ndcg_at_1000_max": 0.734208, + "nauc_ndcg_at_1000_std": -0.080444, + "nauc_ndcg_at_1000_diff1": 0.806596, + "nauc_map_at_1_max": 0.686822, + "nauc_map_at_1_std": -0.1433, + "nauc_map_at_1_diff1": 0.835391, + "nauc_map_at_3_max": 0.728221, + "nauc_map_at_3_std": -0.117674, + "nauc_map_at_3_diff1": 0.814403, + "nauc_map_at_5_max": 0.727231, + "nauc_map_at_5_std": -0.111054, + "nauc_map_at_5_diff1": 0.812872, + "nauc_map_at_10_max": 0.725743, + "nauc_map_at_10_std": -0.107111, + "nauc_map_at_10_diff1": 0.812322, + "nauc_map_at_20_max": 0.725401, + "nauc_map_at_20_std": -0.10569, + "nauc_map_at_20_diff1": 0.812699, + "nauc_map_at_100_max": 0.725065, + "nauc_map_at_100_std": -0.105702, + "nauc_map_at_100_diff1": 0.812939, + "nauc_map_at_1000_max": 0.725001, + "nauc_map_at_1000_std": -0.105859, + "nauc_map_at_1000_diff1": 0.812991, + "nauc_recall_at_1_max": 0.686822, + "nauc_recall_at_1_std": -0.1433, + "nauc_recall_at_1_diff1": 0.835391, + "nauc_recall_at_3_max": 0.801437, + "nauc_recall_at_3_std": -0.065093, + "nauc_recall_at_3_diff1": 0.778541, + "nauc_recall_at_5_max": 0.808685, + "nauc_recall_at_5_std": -0.008408, + "nauc_recall_at_5_diff1": 0.761503, + "nauc_recall_at_10_max": 0.809148, + "nauc_recall_at_10_std": 0.071672, + "nauc_recall_at_10_diff1": 0.743842, + "nauc_recall_at_20_max": 0.820349, + "nauc_recall_at_20_std": 0.170252, + "nauc_recall_at_20_diff1": 0.739967, + "nauc_recall_at_100_max": 0.8357, + "nauc_recall_at_100_std": 0.307906, + "nauc_recall_at_100_diff1": 0.737593, + "nauc_recall_at_1000_max": 0.85116, + "nauc_recall_at_1000_std": 0.411397, + "nauc_recall_at_1000_diff1": 0.730309, + "nauc_precision_at_1_max": 0.686822, + "nauc_precision_at_1_std": -0.1433, + "nauc_precision_at_1_diff1": 0.835391, + "nauc_precision_at_3_max": 0.801437, + "nauc_precision_at_3_std": -0.065093, + "nauc_precision_at_3_diff1": 0.778541, + "nauc_precision_at_5_max": 0.808685, + "nauc_precision_at_5_std": -0.008408, + "nauc_precision_at_5_diff1": 0.761503, + "nauc_precision_at_10_max": 0.809148, + "nauc_precision_at_10_std": 0.071672, + "nauc_precision_at_10_diff1": 0.743842, + "nauc_precision_at_20_max": 0.820349, + "nauc_precision_at_20_std": 0.170252, + "nauc_precision_at_20_diff1": 0.739967, + "nauc_precision_at_100_max": 0.8357, + "nauc_precision_at_100_std": 0.307906, + "nauc_precision_at_100_diff1": 0.737593, + "nauc_precision_at_1000_max": 0.85116, + "nauc_precision_at_1000_std": 0.411397, + "nauc_precision_at_1000_diff1": 0.730309, + "nauc_mrr_at_1_max": 0.686822, + "nauc_mrr_at_1_std": -0.1433, + "nauc_mrr_at_1_diff1": 0.835391, + "nauc_mrr_at_3_max": 0.728221, + "nauc_mrr_at_3_std": -0.117674, + "nauc_mrr_at_3_diff1": 0.814403, + "nauc_mrr_at_5_max": 0.727231, + "nauc_mrr_at_5_std": -0.111054, + "nauc_mrr_at_5_diff1": 0.812872, + "nauc_mrr_at_10_max": 0.725743, + "nauc_mrr_at_10_std": -0.107111, + "nauc_mrr_at_10_diff1": 0.812322, + "nauc_mrr_at_20_max": 0.725401, + "nauc_mrr_at_20_std": -0.10569, + "nauc_mrr_at_20_diff1": 0.812699, + "nauc_mrr_at_100_max": 0.725065, + "nauc_mrr_at_100_std": -0.105702, + "nauc_mrr_at_100_diff1": 0.812939, + "nauc_mrr_at_1000_max": 0.725001, + "nauc_mrr_at_1000_std": -0.105859, + "nauc_mrr_at_1000_diff1": 0.812991, + "main_score": 0.83266, + "hf_subset": "java", + "languages": [ + "java-Code" + ] + }, + { + "ndcg_at_1": 0.76495, + "ndcg_at_3": 0.83089, + "ndcg_at_5": 0.84214, + "ndcg_at_10": 0.85123, + "ndcg_at_20": 0.85638, + "ndcg_at_100": 0.86174, + "ndcg_at_1000": 0.86362, + "map_at_1": 0.76495, + "map_at_3": 0.81539, + "map_at_5": 0.82168, + "map_at_10": 0.82544, + "map_at_20": 0.82685, + "map_at_100": 0.8276, + "map_at_1000": 0.82767, + "recall_at_1": 0.76495, + "recall_at_3": 0.87548, + "recall_at_5": 0.9026, + "recall_at_10": 0.93064, + "recall_at_20": 0.95105, + "recall_at_100": 0.97973, + "recall_at_1000": 0.99458, + "precision_at_1": 0.76495, + "precision_at_3": 0.29183, + "precision_at_5": 0.18052, + "precision_at_10": 0.09306, + "precision_at_20": 0.04755, + "precision_at_100": 0.0098, + "precision_at_1000": 0.00099, + "mrr_at_1": 0.764949, + "mrr_at_3": 0.815387, + "mrr_at_5": 0.821677, + "mrr_at_10": 0.825441, + "mrr_at_20": 0.826847, + "mrr_at_100": 0.827602, + "mrr_at_1000": 0.827673, + "nauc_ndcg_at_1_max": 0.610916, + "nauc_ndcg_at_1_std": -0.26239, + "nauc_ndcg_at_1_diff1": 0.851584, + "nauc_ndcg_at_3_max": 0.671686, + "nauc_ndcg_at_3_std": -0.252447, + "nauc_ndcg_at_3_diff1": 0.824892, + "nauc_ndcg_at_5_max": 0.674197, + "nauc_ndcg_at_5_std": -0.237479, + "nauc_ndcg_at_5_diff1": 0.823402, + "nauc_ndcg_at_10_max": 0.674351, + "nauc_ndcg_at_10_std": -0.226304, + "nauc_ndcg_at_10_diff1": 0.825866, + "nauc_ndcg_at_20_max": 0.671843, + "nauc_ndcg_at_20_std": -0.220833, + "nauc_ndcg_at_20_diff1": 0.827535, + "nauc_ndcg_at_100_max": 0.666781, + "nauc_ndcg_at_100_std": -0.222602, + "nauc_ndcg_at_100_diff1": 0.829826, + "nauc_ndcg_at_1000_max": 0.663843, + "nauc_ndcg_at_1000_std": -0.229839, + "nauc_ndcg_at_1000_diff1": 0.830229, + "nauc_map_at_1_max": 0.610916, + "nauc_map_at_1_std": -0.26239, + "nauc_map_at_1_diff1": 0.851584, + "nauc_map_at_3_max": 0.655001, + "nauc_map_at_3_std": -0.255911, + "nauc_map_at_3_diff1": 0.83228, + "nauc_map_at_5_max": 0.655743, + "nauc_map_at_5_std": -0.24853, + "nauc_map_at_5_diff1": 0.831861, + "nauc_map_at_10_max": 0.655401, + "nauc_map_at_10_std": -0.244956, + "nauc_map_at_10_diff1": 0.832961, + "nauc_map_at_20_max": 0.654677, + "nauc_map_at_20_std": -0.243868, + "nauc_map_at_20_diff1": 0.833388, + "nauc_map_at_100_max": 0.654054, + "nauc_map_at_100_std": -0.244031, + "nauc_map_at_100_diff1": 0.833658, + "nauc_map_at_1000_max": 0.653965, + "nauc_map_at_1000_std": -0.244235, + "nauc_map_at_1000_diff1": 0.833673, + "nauc_recall_at_1_max": 0.610916, + "nauc_recall_at_1_std": -0.26239, + "nauc_recall_at_1_diff1": 0.851584, + "nauc_recall_at_3_max": 0.738669, + "nauc_recall_at_3_std": -0.238074, + "nauc_recall_at_3_diff1": 0.795192, + "nauc_recall_at_5_max": 0.764026, + "nauc_recall_at_5_std": -0.179609, + "nauc_recall_at_5_diff1": 0.781868, + "nauc_recall_at_10_max": 0.800916, + "nauc_recall_at_10_std": -0.085169, + "nauc_recall_at_10_diff1": 0.780036, + "nauc_recall_at_20_max": 0.826076, + "nauc_recall_at_20_std": 0.032991, + "nauc_recall_at_20_diff1": 0.779473, + "nauc_recall_at_100_max": 0.867964, + "nauc_recall_at_100_std": 0.314925, + "nauc_recall_at_100_diff1": 0.79102, + "nauc_recall_at_1000_max": 0.869971, + "nauc_recall_at_1000_std": 0.421816, + "nauc_recall_at_1000_diff1": 0.754558, + "nauc_precision_at_1_max": 0.610916, + "nauc_precision_at_1_std": -0.26239, + "nauc_precision_at_1_diff1": 0.851584, + "nauc_precision_at_3_max": 0.738669, + "nauc_precision_at_3_std": -0.238074, + "nauc_precision_at_3_diff1": 0.795192, + "nauc_precision_at_5_max": 0.764026, + "nauc_precision_at_5_std": -0.179609, + "nauc_precision_at_5_diff1": 0.781868, + "nauc_precision_at_10_max": 0.800916, + "nauc_precision_at_10_std": -0.085169, + "nauc_precision_at_10_diff1": 0.780036, + "nauc_precision_at_20_max": 0.826076, + "nauc_precision_at_20_std": 0.032991, + "nauc_precision_at_20_diff1": 0.779473, + "nauc_precision_at_100_max": 0.867964, + "nauc_precision_at_100_std": 0.314925, + "nauc_precision_at_100_diff1": 0.79102, + "nauc_precision_at_1000_max": 0.869971, + "nauc_precision_at_1000_std": 0.421816, + "nauc_precision_at_1000_diff1": 0.754558, + "nauc_mrr_at_1_max": 0.610916, + "nauc_mrr_at_1_std": -0.26239, + "nauc_mrr_at_1_diff1": 0.851584, + "nauc_mrr_at_3_max": 0.655001, + "nauc_mrr_at_3_std": -0.255911, + "nauc_mrr_at_3_diff1": 0.83228, + "nauc_mrr_at_5_max": 0.655743, + "nauc_mrr_at_5_std": -0.24853, + "nauc_mrr_at_5_diff1": 0.831861, + "nauc_mrr_at_10_max": 0.655401, + "nauc_mrr_at_10_std": -0.244956, + "nauc_mrr_at_10_diff1": 0.832961, + "nauc_mrr_at_20_max": 0.654677, + "nauc_mrr_at_20_std": -0.243868, + "nauc_mrr_at_20_diff1": 0.833388, + "nauc_mrr_at_100_max": 0.654054, + "nauc_mrr_at_100_std": -0.244031, + "nauc_mrr_at_100_diff1": 0.833658, + "nauc_mrr_at_1000_max": 0.653965, + "nauc_mrr_at_1000_std": -0.244235, + "nauc_mrr_at_1000_diff1": 0.833673, + "main_score": 0.85123, + "hf_subset": "php", + "languages": [ + "php-Code" + ] + } + ] + }, + "evaluation_time": 441.71198749542236, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackAndroidRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackAndroidRetrieval.json new file mode 100644 index 0000000000..0f591fd972 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackAndroidRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "f46a197baaae43b4f621051089b82a364682dfeb", + "task_name": "CQADupstackAndroidRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.43348, + "ndcg_at_3": 0.47299, + "ndcg_at_5": 0.49808, + "ndcg_at_10": 0.5265, + "ndcg_at_20": 0.55037, + "ndcg_at_100": 0.57863, + "ndcg_at_1000": 0.59742, + "map_at_1": 0.35003, + "map_at_3": 0.42497, + "map_at_5": 0.4462, + "map_at_10": 0.46288, + "map_at_20": 0.47219, + "map_at_100": 0.47854, + "map_at_1000": 0.47972, + "recall_at_1": 0.35003, + "recall_at_3": 0.48863, + "recall_at_5": 0.55687, + "recall_at_10": 0.64298, + "recall_at_20": 0.72741, + "recall_at_100": 0.85343, + "recall_at_1000": 0.97352, + "precision_at_1": 0.43348, + "precision_at_3": 0.2227, + "precision_at_5": 0.1628, + "precision_at_10": 0.09928, + "precision_at_20": 0.05937, + "precision_at_100": 0.01554, + "precision_at_1000": 0.002, + "mrr_at_1": 0.433476, + "mrr_at_3": 0.499762, + "mrr_at_5": 0.516571, + "mrr_at_10": 0.5274, + "mrr_at_20": 0.532506, + "mrr_at_100": 0.534776, + "mrr_at_1000": 0.535223, + "nauc_ndcg_at_1_max": 0.385771, + "nauc_ndcg_at_1_std": -0.113596, + "nauc_ndcg_at_1_diff1": 0.543297, + "nauc_ndcg_at_3_max": 0.368208, + "nauc_ndcg_at_3_std": -0.101403, + "nauc_ndcg_at_3_diff1": 0.485733, + "nauc_ndcg_at_5_max": 0.375041, + "nauc_ndcg_at_5_std": -0.084839, + "nauc_ndcg_at_5_diff1": 0.475665, + "nauc_ndcg_at_10_max": 0.384833, + "nauc_ndcg_at_10_std": -0.063765, + "nauc_ndcg_at_10_diff1": 0.477584, + "nauc_ndcg_at_20_max": 0.388884, + "nauc_ndcg_at_20_std": -0.048903, + "nauc_ndcg_at_20_diff1": 0.478039, + "nauc_ndcg_at_100_max": 0.388899, + "nauc_ndcg_at_100_std": -0.045543, + "nauc_ndcg_at_100_diff1": 0.48481, + "nauc_ndcg_at_1000_max": 0.392826, + "nauc_ndcg_at_1000_std": -0.053571, + "nauc_ndcg_at_1000_diff1": 0.489757, + "nauc_map_at_1_max": 0.338852, + "nauc_map_at_1_std": -0.1091, + "nauc_map_at_1_diff1": 0.555676, + "nauc_map_at_3_max": 0.359646, + "nauc_map_at_3_std": -0.099787, + "nauc_map_at_3_diff1": 0.519482, + "nauc_map_at_5_max": 0.371112, + "nauc_map_at_5_std": -0.089962, + "nauc_map_at_5_diff1": 0.513019, + "nauc_map_at_10_max": 0.379638, + "nauc_map_at_10_std": -0.080184, + "nauc_map_at_10_diff1": 0.510559, + "nauc_map_at_20_max": 0.382164, + "nauc_map_at_20_std": -0.074705, + "nauc_map_at_20_diff1": 0.508835, + "nauc_map_at_100_max": 0.383195, + "nauc_map_at_100_std": -0.074139, + "nauc_map_at_100_diff1": 0.509352, + "nauc_map_at_1000_max": 0.383352, + "nauc_map_at_1000_std": -0.0746, + "nauc_map_at_1000_diff1": 0.509273, + "nauc_recall_at_1_max": 0.338852, + "nauc_recall_at_1_std": -0.1091, + "nauc_recall_at_1_diff1": 0.555676, + "nauc_recall_at_3_max": 0.336738, + "nauc_recall_at_3_std": -0.087676, + "nauc_recall_at_3_diff1": 0.444386, + "nauc_recall_at_5_max": 0.339798, + "nauc_recall_at_5_std": -0.053578, + "nauc_recall_at_5_diff1": 0.398958, + "nauc_recall_at_10_max": 0.355395, + "nauc_recall_at_10_std": 0.013892, + "nauc_recall_at_10_diff1": 0.374608, + "nauc_recall_at_20_max": 0.363714, + "nauc_recall_at_20_std": 0.087795, + "nauc_recall_at_20_diff1": 0.356828, + "nauc_recall_at_100_max": 0.337428, + "nauc_recall_at_100_std": 0.201305, + "nauc_recall_at_100_diff1": 0.349063, + "nauc_recall_at_1000_max": 0.497309, + "nauc_recall_at_1000_std": 0.654219, + "nauc_recall_at_1000_diff1": 0.406209, + "nauc_precision_at_1_max": 0.385771, + "nauc_precision_at_1_std": -0.113596, + "nauc_precision_at_1_diff1": 0.543297, + "nauc_precision_at_3_max": 0.328791, + "nauc_precision_at_3_std": -0.075414, + "nauc_precision_at_3_diff1": 0.296826, + "nauc_precision_at_5_max": 0.309749, + "nauc_precision_at_5_std": -0.025772, + "nauc_precision_at_5_diff1": 0.182252, + "nauc_precision_at_10_max": 0.260241, + "nauc_precision_at_10_std": 0.022944, + "nauc_precision_at_10_diff1": 0.077485, + "nauc_precision_at_20_max": 0.186782, + "nauc_precision_at_20_std": 0.051483, + "nauc_precision_at_20_diff1": -0.028997, + "nauc_precision_at_100_max": 0.041248, + "nauc_precision_at_100_std": 0.012495, + "nauc_precision_at_100_diff1": -0.133671, + "nauc_precision_at_1000_max": -0.076422, + "nauc_precision_at_1000_std": -0.076125, + "nauc_precision_at_1000_diff1": -0.233152, + "nauc_mrr_at_1_max": 0.385771, + "nauc_mrr_at_1_std": -0.113596, + "nauc_mrr_at_1_diff1": 0.543297, + "nauc_mrr_at_3_max": 0.383154, + "nauc_mrr_at_3_std": -0.103418, + "nauc_mrr_at_3_diff1": 0.49306, + "nauc_mrr_at_5_max": 0.386482, + "nauc_mrr_at_5_std": -0.096454, + "nauc_mrr_at_5_diff1": 0.486042, + "nauc_mrr_at_10_max": 0.388932, + "nauc_mrr_at_10_std": -0.090354, + "nauc_mrr_at_10_diff1": 0.487027, + "nauc_mrr_at_20_max": 0.388543, + "nauc_mrr_at_20_std": -0.086836, + "nauc_mrr_at_20_diff1": 0.489009, + "nauc_mrr_at_100_max": 0.38829, + "nauc_mrr_at_100_std": -0.087135, + "nauc_mrr_at_100_diff1": 0.489577, + "nauc_mrr_at_1000_max": 0.388445, + "nauc_mrr_at_1000_std": -0.08713, + "nauc_mrr_at_1000_diff1": 0.4897, + "main_score": 0.5265, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 3.2247705459594727, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackEnglishRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackEnglishRetrieval.json new file mode 100644 index 0000000000..bf9d0629c8 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackEnglishRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "ad9991cb51e31e31e430383c75ffb2885547b5f0", + "task_name": "CQADupstackEnglishRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.41338, + "ndcg_at_3": 0.45761, + "ndcg_at_5": 0.47919, + "ndcg_at_10": 0.49934, + "ndcg_at_20": 0.51623, + "ndcg_at_100": 0.54418, + "ndcg_at_1000": 0.56289, + "map_at_1": 0.32389, + "map_at_3": 0.40641, + "map_at_5": 0.42549, + "map_at_10": 0.43805, + "map_at_20": 0.44516, + "map_at_100": 0.45157, + "map_at_1000": 0.45284, + "recall_at_1": 0.32389, + "recall_at_3": 0.47745, + "recall_at_5": 0.53848, + "recall_at_10": 0.60258, + "recall_at_20": 0.66458, + "recall_at_100": 0.7923, + "recall_at_1000": 0.90867, + "precision_at_1": 0.41338, + "precision_at_3": 0.22335, + "precision_at_5": 0.15924, + "precision_at_10": 0.09503, + "precision_at_20": 0.0558, + "precision_at_100": 0.01529, + "precision_at_1000": 0.00198, + "mrr_at_1": 0.413376, + "mrr_at_3": 0.48259, + "mrr_at_5": 0.496125, + "mrr_at_10": 0.5043, + "mrr_at_20": 0.508001, + "mrr_at_100": 0.510501, + "mrr_at_1000": 0.510917, + "nauc_ndcg_at_1_max": 0.490937, + "nauc_ndcg_at_1_std": 0.045345, + "nauc_ndcg_at_1_diff1": 0.540431, + "nauc_ndcg_at_3_max": 0.50445, + "nauc_ndcg_at_3_std": 0.068706, + "nauc_ndcg_at_3_diff1": 0.514311, + "nauc_ndcg_at_5_max": 0.507483, + "nauc_ndcg_at_5_std": 0.073721, + "nauc_ndcg_at_5_diff1": 0.512674, + "nauc_ndcg_at_10_max": 0.515912, + "nauc_ndcg_at_10_std": 0.09034, + "nauc_ndcg_at_10_diff1": 0.513074, + "nauc_ndcg_at_20_max": 0.520932, + "nauc_ndcg_at_20_std": 0.097695, + "nauc_ndcg_at_20_diff1": 0.51641, + "nauc_ndcg_at_100_max": 0.523772, + "nauc_ndcg_at_100_std": 0.111663, + "nauc_ndcg_at_100_diff1": 0.513543, + "nauc_ndcg_at_1000_max": 0.519772, + "nauc_ndcg_at_1000_std": 0.112374, + "nauc_ndcg_at_1000_diff1": 0.510777, + "nauc_map_at_1_max": 0.410926, + "nauc_map_at_1_std": -0.032867, + "nauc_map_at_1_diff1": 0.575962, + "nauc_map_at_3_max": 0.472694, + "nauc_map_at_3_std": 0.020319, + "nauc_map_at_3_diff1": 0.542982, + "nauc_map_at_5_max": 0.485385, + "nauc_map_at_5_std": 0.032362, + "nauc_map_at_5_diff1": 0.538315, + "nauc_map_at_10_max": 0.493485, + "nauc_map_at_10_std": 0.044975, + "nauc_map_at_10_diff1": 0.536283, + "nauc_map_at_20_max": 0.497242, + "nauc_map_at_20_std": 0.050481, + "nauc_map_at_20_diff1": 0.535834, + "nauc_map_at_100_max": 0.500296, + "nauc_map_at_100_std": 0.057242, + "nauc_map_at_100_diff1": 0.533799, + "nauc_map_at_1000_max": 0.500645, + "nauc_map_at_1000_std": 0.058107, + "nauc_map_at_1000_diff1": 0.533534, + "nauc_recall_at_1_max": 0.410926, + "nauc_recall_at_1_std": -0.032867, + "nauc_recall_at_1_diff1": 0.575962, + "nauc_recall_at_3_max": 0.472087, + "nauc_recall_at_3_std": 0.058619, + "nauc_recall_at_3_diff1": 0.490395, + "nauc_recall_at_5_max": 0.483301, + "nauc_recall_at_5_std": 0.083457, + "nauc_recall_at_5_diff1": 0.46941, + "nauc_recall_at_10_max": 0.509232, + "nauc_recall_at_10_std": 0.141187, + "nauc_recall_at_10_diff1": 0.453997, + "nauc_recall_at_20_max": 0.523899, + "nauc_recall_at_20_std": 0.184053, + "nauc_recall_at_20_diff1": 0.447127, + "nauc_recall_at_100_max": 0.558499, + "nauc_recall_at_100_std": 0.322044, + "nauc_recall_at_100_diff1": 0.426082, + "nauc_recall_at_1000_max": 0.554781, + "nauc_recall_at_1000_std": 0.518818, + "nauc_recall_at_1000_diff1": 0.363726, + "nauc_precision_at_1_max": 0.490937, + "nauc_precision_at_1_std": 0.045345, + "nauc_precision_at_1_diff1": 0.540431, + "nauc_precision_at_3_max": 0.477237, + "nauc_precision_at_3_std": 0.173762, + "nauc_precision_at_3_diff1": 0.292933, + "nauc_precision_at_5_max": 0.430068, + "nauc_precision_at_5_std": 0.205837, + "nauc_precision_at_5_diff1": 0.197213, + "nauc_precision_at_10_max": 0.367994, + "nauc_precision_at_10_std": 0.252109, + "nauc_precision_at_10_diff1": 0.098705, + "nauc_precision_at_20_max": 0.304994, + "nauc_precision_at_20_std": 0.270097, + "nauc_precision_at_20_diff1": 0.028578, + "nauc_precision_at_100_max": 0.191305, + "nauc_precision_at_100_std": 0.299215, + "nauc_precision_at_100_diff1": -0.096253, + "nauc_precision_at_1000_max": 0.06439, + "nauc_precision_at_1000_std": 0.245539, + "nauc_precision_at_1000_diff1": -0.175336, + "nauc_mrr_at_1_max": 0.490937, + "nauc_mrr_at_1_std": 0.045345, + "nauc_mrr_at_1_diff1": 0.540431, + "nauc_mrr_at_3_max": 0.51371, + "nauc_mrr_at_3_std": 0.082402, + "nauc_mrr_at_3_diff1": 0.51102, + "nauc_mrr_at_5_max": 0.51427, + "nauc_mrr_at_5_std": 0.087217, + "nauc_mrr_at_5_diff1": 0.50861, + "nauc_mrr_at_10_max": 0.517043, + "nauc_mrr_at_10_std": 0.092814, + "nauc_mrr_at_10_diff1": 0.508882, + "nauc_mrr_at_20_max": 0.517856, + "nauc_mrr_at_20_std": 0.095097, + "nauc_mrr_at_20_diff1": 0.509149, + "nauc_mrr_at_100_max": 0.51731, + "nauc_mrr_at_100_std": 0.095318, + "nauc_mrr_at_100_diff1": 0.508719, + "nauc_mrr_at_1000_max": 0.51718, + "nauc_mrr_at_1000_std": 0.095177, + "nauc_mrr_at_1000_diff1": 0.508762, + "main_score": 0.49934, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 6.088695526123047, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackGamingRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackGamingRetrieval.json new file mode 100644 index 0000000000..a63a3e1a30 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackGamingRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "4885aa143210c98657558c04aaf3dc47cfb54340", + "task_name": "CQADupstackGamingRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.47586, + "ndcg_at_3": 0.54847, + "ndcg_at_5": 0.57856, + "ndcg_at_10": 0.60396, + "ndcg_at_20": 0.62293, + "ndcg_at_100": 0.64379, + "ndcg_at_1000": 0.65325, + "map_at_1": 0.41336, + "map_at_3": 0.51017, + "map_at_5": 0.53116, + "map_at_10": 0.54453, + "map_at_20": 0.55128, + "map_at_100": 0.55501, + "map_at_1000": 0.5555, + "recall_at_1": 0.41336, + "recall_at_3": 0.5987, + "recall_at_5": 0.67162, + "recall_at_10": 0.74543, + "recall_at_20": 0.81486, + "recall_at_100": 0.91541, + "recall_at_1000": 0.982, + "precision_at_1": 0.47586, + "precision_at_3": 0.24535, + "precision_at_5": 0.17016, + "precision_at_10": 0.09724, + "precision_at_20": 0.05455, + "precision_at_100": 0.01263, + "precision_at_1000": 0.00138, + "mrr_at_1": 0.475862, + "mrr_at_3": 0.553396, + "mrr_at_5": 0.569195, + "mrr_at_10": 0.578038, + "mrr_at_20": 0.582262, + "mrr_at_100": 0.584618, + "mrr_at_1000": 0.584858, + "nauc_ndcg_at_1_max": 0.434516, + "nauc_ndcg_at_1_std": -0.045129, + "nauc_ndcg_at_1_diff1": 0.519005, + "nauc_ndcg_at_3_max": 0.423675, + "nauc_ndcg_at_3_std": -0.055235, + "nauc_ndcg_at_3_diff1": 0.468824, + "nauc_ndcg_at_5_max": 0.435119, + "nauc_ndcg_at_5_std": -0.038831, + "nauc_ndcg_at_5_diff1": 0.465, + "nauc_ndcg_at_10_max": 0.44807, + "nauc_ndcg_at_10_std": -0.018454, + "nauc_ndcg_at_10_diff1": 0.461703, + "nauc_ndcg_at_20_max": 0.449931, + "nauc_ndcg_at_20_std": -0.001848, + "nauc_ndcg_at_20_diff1": 0.459052, + "nauc_ndcg_at_100_max": 0.456798, + "nauc_ndcg_at_100_std": 0.005067, + "nauc_ndcg_at_100_diff1": 0.468934, + "nauc_ndcg_at_1000_max": 0.451372, + "nauc_ndcg_at_1000_std": -0.00556, + "nauc_ndcg_at_1000_diff1": 0.472366, + "nauc_map_at_1_max": 0.370894, + "nauc_map_at_1_std": -0.073412, + "nauc_map_at_1_diff1": 0.537315, + "nauc_map_at_3_max": 0.409226, + "nauc_map_at_3_std": -0.071679, + "nauc_map_at_3_diff1": 0.489034, + "nauc_map_at_5_max": 0.422141, + "nauc_map_at_5_std": -0.055822, + "nauc_map_at_5_diff1": 0.486392, + "nauc_map_at_10_max": 0.431454, + "nauc_map_at_10_std": -0.04492, + "nauc_map_at_10_diff1": 0.485106, + "nauc_map_at_20_max": 0.434171, + "nauc_map_at_20_std": -0.037662, + "nauc_map_at_20_diff1": 0.483927, + "nauc_map_at_100_max": 0.435838, + "nauc_map_at_100_std": -0.035103, + "nauc_map_at_100_diff1": 0.484614, + "nauc_map_at_1000_max": 0.435831, + "nauc_map_at_1000_std": -0.035352, + "nauc_map_at_1000_diff1": 0.484762, + "nauc_recall_at_1_max": 0.370894, + "nauc_recall_at_1_std": -0.073412, + "nauc_recall_at_1_diff1": 0.537315, + "nauc_recall_at_3_max": 0.393257, + "nauc_recall_at_3_std": -0.075882, + "nauc_recall_at_3_diff1": 0.421379, + "nauc_recall_at_5_max": 0.411353, + "nauc_recall_at_5_std": -0.035745, + "nauc_recall_at_5_diff1": 0.395484, + "nauc_recall_at_10_max": 0.4583, + "nauc_recall_at_10_std": 0.042987, + "nauc_recall_at_10_diff1": 0.365825, + "nauc_recall_at_20_max": 0.477911, + "nauc_recall_at_20_std": 0.152636, + "nauc_recall_at_20_diff1": 0.322423, + "nauc_recall_at_100_max": 0.612039, + "nauc_recall_at_100_std": 0.360867, + "nauc_recall_at_100_diff1": 0.372858, + "nauc_recall_at_1000_max": 0.660089, + "nauc_recall_at_1000_std": 0.499023, + "nauc_recall_at_1000_diff1": 0.491238, + "nauc_precision_at_1_max": 0.434516, + "nauc_precision_at_1_std": -0.045129, + "nauc_precision_at_1_diff1": 0.519005, + "nauc_precision_at_3_max": 0.389155, + "nauc_precision_at_3_std": 0.012751, + "nauc_precision_at_3_diff1": 0.240521, + "nauc_precision_at_5_max": 0.365872, + "nauc_precision_at_5_std": 0.090968, + "nauc_precision_at_5_diff1": 0.147316, + "nauc_precision_at_10_max": 0.340434, + "nauc_precision_at_10_std": 0.164187, + "nauc_precision_at_10_diff1": 0.059549, + "nauc_precision_at_20_max": 0.288192, + "nauc_precision_at_20_std": 0.242657, + "nauc_precision_at_20_diff1": -0.031, + "nauc_precision_at_100_max": 0.203126, + "nauc_precision_at_100_std": 0.287618, + "nauc_precision_at_100_diff1": -0.118901, + "nauc_precision_at_1000_max": 0.118736, + "nauc_precision_at_1000_std": 0.239765, + "nauc_precision_at_1000_diff1": -0.159422, + "nauc_mrr_at_1_max": 0.434516, + "nauc_mrr_at_1_std": -0.045129, + "nauc_mrr_at_1_diff1": 0.519005, + "nauc_mrr_at_3_max": 0.439976, + "nauc_mrr_at_3_std": -0.03227, + "nauc_mrr_at_3_diff1": 0.477614, + "nauc_mrr_at_5_max": 0.441938, + "nauc_mrr_at_5_std": -0.02746, + "nauc_mrr_at_5_diff1": 0.474706, + "nauc_mrr_at_10_max": 0.445588, + "nauc_mrr_at_10_std": -0.021094, + "nauc_mrr_at_10_diff1": 0.473778, + "nauc_mrr_at_20_max": 0.445323, + "nauc_mrr_at_20_std": -0.019186, + "nauc_mrr_at_20_diff1": 0.473611, + "nauc_mrr_at_100_max": 0.445963, + "nauc_mrr_at_100_std": -0.019177, + "nauc_mrr_at_100_diff1": 0.475042, + "nauc_mrr_at_1000_max": 0.44579, + "nauc_mrr_at_1000_std": -0.019497, + "nauc_mrr_at_1000_diff1": 0.475159, + "main_score": 0.60396, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 6.5216224193573, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackGisRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackGisRetrieval.json new file mode 100644 index 0000000000..898118fb2d --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackGisRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "5003b3064772da1887988e05400cf3806fe491f2", + "task_name": "CQADupstackGisRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.31299, + "ndcg_at_3": 0.37814, + "ndcg_at_5": 0.40701, + "ndcg_at_10": 0.436, + "ndcg_at_20": 0.45665, + "ndcg_at_100": 0.48521, + "ndcg_at_1000": 0.50406, + "map_at_1": 0.29022, + "map_at_3": 0.353, + "map_at_5": 0.36999, + "map_at_10": 0.38291, + "map_at_20": 0.38877, + "map_at_100": 0.3931, + "map_at_1000": 0.39392, + "recall_at_1": 0.29022, + "recall_at_3": 0.42384, + "recall_at_5": 0.49434, + "recall_at_10": 0.57887, + "recall_at_20": 0.65698, + "recall_at_100": 0.8013, + "recall_at_1000": 0.93883, + "precision_at_1": 0.31299, + "precision_at_3": 0.15782, + "precision_at_5": 0.11073, + "precision_at_10": 0.06633, + "precision_at_20": 0.03836, + "precision_at_100": 0.00959, + "precision_at_1000": 0.00116, + "mrr_at_1": 0.312994, + "mrr_at_3": 0.375518, + "mrr_at_5": 0.392072, + "mrr_at_10": 0.404246, + "mrr_at_20": 0.40942, + "mrr_at_100": 0.41293, + "mrr_at_1000": 0.413508, + "nauc_ndcg_at_1_max": 0.296754, + "nauc_ndcg_at_1_std": -0.12548, + "nauc_ndcg_at_1_diff1": 0.385818, + "nauc_ndcg_at_3_max": 0.282283, + "nauc_ndcg_at_3_std": -0.061322, + "nauc_ndcg_at_3_diff1": 0.322512, + "nauc_ndcg_at_5_max": 0.305721, + "nauc_ndcg_at_5_std": -0.042465, + "nauc_ndcg_at_5_diff1": 0.323164, + "nauc_ndcg_at_10_max": 0.30515, + "nauc_ndcg_at_10_std": -0.042313, + "nauc_ndcg_at_10_diff1": 0.316435, + "nauc_ndcg_at_20_max": 0.309273, + "nauc_ndcg_at_20_std": -0.030291, + "nauc_ndcg_at_20_diff1": 0.3076, + "nauc_ndcg_at_100_max": 0.318087, + "nauc_ndcg_at_100_std": -0.023713, + "nauc_ndcg_at_100_diff1": 0.315882, + "nauc_ndcg_at_1000_max": 0.312448, + "nauc_ndcg_at_1000_std": -0.029017, + "nauc_ndcg_at_1000_diff1": 0.319117, + "nauc_map_at_1_max": 0.280543, + "nauc_map_at_1_std": -0.13441, + "nauc_map_at_1_diff1": 0.404762, + "nauc_map_at_3_max": 0.280725, + "nauc_map_at_3_std": -0.079209, + "nauc_map_at_3_diff1": 0.342805, + "nauc_map_at_5_max": 0.29593, + "nauc_map_at_5_std": -0.068284, + "nauc_map_at_5_diff1": 0.34253, + "nauc_map_at_10_max": 0.297418, + "nauc_map_at_10_std": -0.067033, + "nauc_map_at_10_diff1": 0.339186, + "nauc_map_at_20_max": 0.298849, + "nauc_map_at_20_std": -0.063757, + "nauc_map_at_20_diff1": 0.337146, + "nauc_map_at_100_max": 0.300622, + "nauc_map_at_100_std": -0.062754, + "nauc_map_at_100_diff1": 0.338568, + "nauc_map_at_1000_max": 0.300417, + "nauc_map_at_1000_std": -0.062957, + "nauc_map_at_1000_diff1": 0.338745, + "nauc_recall_at_1_max": 0.280543, + "nauc_recall_at_1_std": -0.13441, + "nauc_recall_at_1_diff1": 0.404762, + "nauc_recall_at_3_max": 0.257656, + "nauc_recall_at_3_std": -0.021, + "nauc_recall_at_3_diff1": 0.272272, + "nauc_recall_at_5_max": 0.315655, + "nauc_recall_at_5_std": 0.024212, + "nauc_recall_at_5_diff1": 0.269105, + "nauc_recall_at_10_max": 0.312007, + "nauc_recall_at_10_std": 0.029949, + "nauc_recall_at_10_diff1": 0.244622, + "nauc_recall_at_20_max": 0.329873, + "nauc_recall_at_20_std": 0.094291, + "nauc_recall_at_20_diff1": 0.196121, + "nauc_recall_at_100_max": 0.410091, + "nauc_recall_at_100_std": 0.20571, + "nauc_recall_at_100_diff1": 0.212105, + "nauc_recall_at_1000_max": 0.417173, + "nauc_recall_at_1000_std": 0.470517, + "nauc_recall_at_1000_diff1": 0.151271, + "nauc_precision_at_1_max": 0.296754, + "nauc_precision_at_1_std": -0.12548, + "nauc_precision_at_1_diff1": 0.385818, + "nauc_precision_at_3_max": 0.303999, + "nauc_precision_at_3_std": 0.001598, + "nauc_precision_at_3_diff1": 0.233015, + "nauc_precision_at_5_max": 0.354382, + "nauc_precision_at_5_std": 0.044023, + "nauc_precision_at_5_diff1": 0.215111, + "nauc_precision_at_10_max": 0.331317, + "nauc_precision_at_10_std": 0.047369, + "nauc_precision_at_10_diff1": 0.154409, + "nauc_precision_at_20_max": 0.330461, + "nauc_precision_at_20_std": 0.102495, + "nauc_precision_at_20_diff1": 0.089982, + "nauc_precision_at_100_max": 0.283871, + "nauc_precision_at_100_std": 0.158617, + "nauc_precision_at_100_diff1": 0.028317, + "nauc_precision_at_1000_max": 0.127146, + "nauc_precision_at_1000_std": 0.128667, + "nauc_precision_at_1000_diff1": -0.089727, + "nauc_mrr_at_1_max": 0.296754, + "nauc_mrr_at_1_std": -0.12548, + "nauc_mrr_at_1_diff1": 0.385818, + "nauc_mrr_at_3_max": 0.291657, + "nauc_mrr_at_3_std": -0.0698, + "nauc_mrr_at_3_diff1": 0.332636, + "nauc_mrr_at_5_max": 0.304004, + "nauc_mrr_at_5_std": -0.059501, + "nauc_mrr_at_5_diff1": 0.333361, + "nauc_mrr_at_10_max": 0.302261, + "nauc_mrr_at_10_std": -0.062592, + "nauc_mrr_at_10_diff1": 0.331187, + "nauc_mrr_at_20_max": 0.302743, + "nauc_mrr_at_20_std": -0.060451, + "nauc_mrr_at_20_diff1": 0.329016, + "nauc_mrr_at_100_max": 0.303695, + "nauc_mrr_at_100_std": -0.059887, + "nauc_mrr_at_100_diff1": 0.330311, + "nauc_mrr_at_1000_max": 0.303485, + "nauc_mrr_at_1000_std": -0.060071, + "nauc_mrr_at_1000_diff1": 0.330473, + "main_score": 0.436, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 5.291266441345215, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackMathematicaRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackMathematicaRetrieval.json new file mode 100644 index 0000000000..0c38c30916 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackMathematicaRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "90fceea13679c63fe563ded68f3b6f06e50061de", + "task_name": "CQADupstackMathematicaRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.23383, + "ndcg_at_3": 0.28211, + "ndcg_at_5": 0.31462, + "ndcg_at_10": 0.33912, + "ndcg_at_20": 0.36276, + "ndcg_at_100": 0.39879, + "ndcg_at_1000": 0.42372, + "map_at_1": 0.18782, + "map_at_3": 0.2483, + "map_at_5": 0.26872, + "map_at_10": 0.28071, + "map_at_20": 0.28794, + "map_at_100": 0.2937, + "map_at_1000": 0.2948, + "recall_at_1": 0.18782, + "recall_at_3": 0.31591, + "recall_at_5": 0.39546, + "recall_at_10": 0.46712, + "recall_at_20": 0.55226, + "recall_at_100": 0.72325, + "recall_at_1000": 0.9, + "precision_at_1": 0.23383, + "precision_at_3": 0.13599, + "precision_at_5": 0.10473, + "precision_at_10": 0.06331, + "precision_at_20": 0.03812, + "precision_at_100": 0.01067, + "precision_at_1000": 0.0014, + "mrr_at_1": 0.233831, + "mrr_at_3": 0.301202, + "mrr_at_5": 0.321538, + "mrr_at_10": 0.330875, + "mrr_at_20": 0.336677, + "mrr_at_100": 0.340884, + "mrr_at_1000": 0.341453, + "nauc_ndcg_at_1_max": 0.231479, + "nauc_ndcg_at_1_std": 0.009344, + "nauc_ndcg_at_1_diff1": 0.284906, + "nauc_ndcg_at_3_max": 0.224569, + "nauc_ndcg_at_3_std": 0.020651, + "nauc_ndcg_at_3_diff1": 0.236746, + "nauc_ndcg_at_5_max": 0.215021, + "nauc_ndcg_at_5_std": 0.024169, + "nauc_ndcg_at_5_diff1": 0.233923, + "nauc_ndcg_at_10_max": 0.215588, + "nauc_ndcg_at_10_std": 0.034311, + "nauc_ndcg_at_10_diff1": 0.239517, + "nauc_ndcg_at_20_max": 0.225002, + "nauc_ndcg_at_20_std": 0.038323, + "nauc_ndcg_at_20_diff1": 0.235314, + "nauc_ndcg_at_100_max": 0.225902, + "nauc_ndcg_at_100_std": 0.055196, + "nauc_ndcg_at_100_diff1": 0.233093, + "nauc_ndcg_at_1000_max": 0.227916, + "nauc_ndcg_at_1000_std": 0.052008, + "nauc_ndcg_at_1000_diff1": 0.235723, + "nauc_map_at_1_max": 0.223814, + "nauc_map_at_1_std": 0.000691, + "nauc_map_at_1_diff1": 0.280122, + "nauc_map_at_3_max": 0.217168, + "nauc_map_at_3_std": 0.01789, + "nauc_map_at_3_diff1": 0.245133, + "nauc_map_at_5_max": 0.212302, + "nauc_map_at_5_std": 0.018875, + "nauc_map_at_5_diff1": 0.243812, + "nauc_map_at_10_max": 0.212113, + "nauc_map_at_10_std": 0.021982, + "nauc_map_at_10_diff1": 0.246115, + "nauc_map_at_20_max": 0.215752, + "nauc_map_at_20_std": 0.023157, + "nauc_map_at_20_diff1": 0.244647, + "nauc_map_at_100_max": 0.215938, + "nauc_map_at_100_std": 0.025717, + "nauc_map_at_100_diff1": 0.243236, + "nauc_map_at_1000_max": 0.216146, + "nauc_map_at_1000_std": 0.025756, + "nauc_map_at_1000_diff1": 0.243191, + "nauc_recall_at_1_max": 0.223814, + "nauc_recall_at_1_std": 0.000691, + "nauc_recall_at_1_diff1": 0.280122, + "nauc_recall_at_3_max": 0.209124, + "nauc_recall_at_3_std": 0.033582, + "nauc_recall_at_3_diff1": 0.203992, + "nauc_recall_at_5_max": 0.186654, + "nauc_recall_at_5_std": 0.039343, + "nauc_recall_at_5_diff1": 0.198366, + "nauc_recall_at_10_max": 0.186997, + "nauc_recall_at_10_std": 0.066913, + "nauc_recall_at_10_diff1": 0.209052, + "nauc_recall_at_20_max": 0.210399, + "nauc_recall_at_20_std": 0.077959, + "nauc_recall_at_20_diff1": 0.190918, + "nauc_recall_at_100_max": 0.218116, + "nauc_recall_at_100_std": 0.2036, + "nauc_recall_at_100_diff1": 0.187483, + "nauc_recall_at_1000_max": 0.260578, + "nauc_recall_at_1000_std": 0.352374, + "nauc_recall_at_1000_diff1": 0.206476, + "nauc_precision_at_1_max": 0.231479, + "nauc_precision_at_1_std": 0.009344, + "nauc_precision_at_1_diff1": 0.284906, + "nauc_precision_at_3_max": 0.232454, + "nauc_precision_at_3_std": 0.037917, + "nauc_precision_at_3_diff1": 0.189271, + "nauc_precision_at_5_max": 0.205819, + "nauc_precision_at_5_std": 0.030816, + "nauc_precision_at_5_diff1": 0.162951, + "nauc_precision_at_10_max": 0.188984, + "nauc_precision_at_10_std": 0.038415, + "nauc_precision_at_10_diff1": 0.15449, + "nauc_precision_at_20_max": 0.197668, + "nauc_precision_at_20_std": 0.044438, + "nauc_precision_at_20_diff1": 0.106451, + "nauc_precision_at_100_max": 0.129045, + "nauc_precision_at_100_std": 0.074455, + "nauc_precision_at_100_diff1": 0.017554, + "nauc_precision_at_1000_max": 0.060491, + "nauc_precision_at_1000_std": 0.011265, + "nauc_precision_at_1000_diff1": -0.020366, + "nauc_mrr_at_1_max": 0.231479, + "nauc_mrr_at_1_std": 0.009344, + "nauc_mrr_at_1_diff1": 0.284906, + "nauc_mrr_at_3_max": 0.237371, + "nauc_mrr_at_3_std": 0.020216, + "nauc_mrr_at_3_diff1": 0.249946, + "nauc_mrr_at_5_max": 0.233754, + "nauc_mrr_at_5_std": 0.020675, + "nauc_mrr_at_5_diff1": 0.247143, + "nauc_mrr_at_10_max": 0.236099, + "nauc_mrr_at_10_std": 0.022712, + "nauc_mrr_at_10_diff1": 0.250387, + "nauc_mrr_at_20_max": 0.237053, + "nauc_mrr_at_20_std": 0.024975, + "nauc_mrr_at_20_diff1": 0.249781, + "nauc_mrr_at_100_max": 0.236334, + "nauc_mrr_at_100_std": 0.02589, + "nauc_mrr_at_100_diff1": 0.249535, + "nauc_mrr_at_1000_max": 0.236279, + "nauc_mrr_at_1000_std": 0.025708, + "nauc_mrr_at_1000_diff1": 0.24965, + "main_score": 0.33912, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 3.874798536300659, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackPhysicsRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackPhysicsRetrieval.json new file mode 100644 index 0000000000..494d33f2dd --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackPhysicsRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4", + "task_name": "CQADupstackPhysicsRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.38595, + "ndcg_at_3": 0.43321, + "ndcg_at_5": 0.46594, + "ndcg_at_10": 0.4921, + "ndcg_at_20": 0.51081, + "ndcg_at_100": 0.5428, + "ndcg_at_1000": 0.56203, + "map_at_1": 0.31266, + "map_at_3": 0.38965, + "map_at_5": 0.41377, + "map_at_10": 0.42791, + "map_at_20": 0.43453, + "map_at_100": 0.44061, + "map_at_1000": 0.44169, + "recall_at_1": 0.31266, + "recall_at_3": 0.4617, + "recall_at_5": 0.54697, + "recall_at_10": 0.62709, + "recall_at_20": 0.68966, + "recall_at_100": 0.83523, + "recall_at_1000": 0.96077, + "precision_at_1": 0.38595, + "precision_at_3": 0.20597, + "precision_at_5": 0.15072, + "precision_at_10": 0.0897, + "precision_at_20": 0.05159, + "precision_at_100": 0.01349, + "precision_at_1000": 0.00168, + "mrr_at_1": 0.385948, + "mrr_at_3": 0.456529, + "mrr_at_5": 0.475201, + "mrr_at_10": 0.485558, + "mrr_at_20": 0.489733, + "mrr_at_100": 0.49294, + "mrr_at_1000": 0.493368, + "nauc_ndcg_at_1_max": 0.378303, + "nauc_ndcg_at_1_std": -0.004562, + "nauc_ndcg_at_1_diff1": 0.529947, + "nauc_ndcg_at_3_max": 0.366288, + "nauc_ndcg_at_3_std": 0.014108, + "nauc_ndcg_at_3_diff1": 0.480487, + "nauc_ndcg_at_5_max": 0.35407, + "nauc_ndcg_at_5_std": 0.024982, + "nauc_ndcg_at_5_diff1": 0.480003, + "nauc_ndcg_at_10_max": 0.35564, + "nauc_ndcg_at_10_std": 0.029399, + "nauc_ndcg_at_10_diff1": 0.477454, + "nauc_ndcg_at_20_max": 0.354337, + "nauc_ndcg_at_20_std": 0.035823, + "nauc_ndcg_at_20_diff1": 0.471136, + "nauc_ndcg_at_100_max": 0.36412, + "nauc_ndcg_at_100_std": 0.056256, + "nauc_ndcg_at_100_diff1": 0.477283, + "nauc_ndcg_at_1000_max": 0.366449, + "nauc_ndcg_at_1000_std": 0.051063, + "nauc_ndcg_at_1000_diff1": 0.476378, + "nauc_map_at_1_max": 0.342191, + "nauc_map_at_1_std": -0.041708, + "nauc_map_at_1_diff1": 0.546326, + "nauc_map_at_3_max": 0.354007, + "nauc_map_at_3_std": -0.006021, + "nauc_map_at_3_diff1": 0.495718, + "nauc_map_at_5_max": 0.352776, + "nauc_map_at_5_std": 0.004155, + "nauc_map_at_5_diff1": 0.494151, + "nauc_map_at_10_max": 0.355719, + "nauc_map_at_10_std": 0.0112, + "nauc_map_at_10_diff1": 0.491821, + "nauc_map_at_20_max": 0.355882, + "nauc_map_at_20_std": 0.013928, + "nauc_map_at_20_diff1": 0.49053, + "nauc_map_at_100_max": 0.357908, + "nauc_map_at_100_std": 0.017492, + "nauc_map_at_100_diff1": 0.491664, + "nauc_map_at_1000_max": 0.35813, + "nauc_map_at_1000_std": 0.017618, + "nauc_map_at_1000_diff1": 0.491616, + "nauc_recall_at_1_max": 0.342191, + "nauc_recall_at_1_std": -0.041708, + "nauc_recall_at_1_diff1": 0.546326, + "nauc_recall_at_3_max": 0.337006, + "nauc_recall_at_3_std": 0.012608, + "nauc_recall_at_3_diff1": 0.436798, + "nauc_recall_at_5_max": 0.307271, + "nauc_recall_at_5_std": 0.044795, + "nauc_recall_at_5_diff1": 0.421271, + "nauc_recall_at_10_max": 0.309587, + "nauc_recall_at_10_std": 0.062143, + "nauc_recall_at_10_diff1": 0.407524, + "nauc_recall_at_20_max": 0.296181, + "nauc_recall_at_20_std": 0.090944, + "nauc_recall_at_20_diff1": 0.372629, + "nauc_recall_at_100_max": 0.352182, + "nauc_recall_at_100_std": 0.295735, + "nauc_recall_at_100_diff1": 0.389912, + "nauc_recall_at_1000_max": 0.519468, + "nauc_recall_at_1000_std": 0.609643, + "nauc_recall_at_1000_diff1": 0.262596, + "nauc_precision_at_1_max": 0.378303, + "nauc_precision_at_1_std": -0.004562, + "nauc_precision_at_1_diff1": 0.529947, + "nauc_precision_at_3_max": 0.335759, + "nauc_precision_at_3_std": 0.088528, + "nauc_precision_at_3_diff1": 0.31813, + "nauc_precision_at_5_max": 0.270905, + "nauc_precision_at_5_std": 0.129495, + "nauc_precision_at_5_diff1": 0.241026, + "nauc_precision_at_10_max": 0.234787, + "nauc_precision_at_10_std": 0.172353, + "nauc_precision_at_10_diff1": 0.15564, + "nauc_precision_at_20_max": 0.173806, + "nauc_precision_at_20_std": 0.183874, + "nauc_precision_at_20_diff1": 0.070198, + "nauc_precision_at_100_max": 0.077608, + "nauc_precision_at_100_std": 0.203109, + "nauc_precision_at_100_diff1": -0.049697, + "nauc_precision_at_1000_max": -0.030479, + "nauc_precision_at_1000_std": 0.149097, + "nauc_precision_at_1000_diff1": -0.159205, + "nauc_mrr_at_1_max": 0.378303, + "nauc_mrr_at_1_std": -0.004562, + "nauc_mrr_at_1_diff1": 0.529947, + "nauc_mrr_at_3_max": 0.379001, + "nauc_mrr_at_3_std": 0.016944, + "nauc_mrr_at_3_diff1": 0.486339, + "nauc_mrr_at_5_max": 0.370101, + "nauc_mrr_at_5_std": 0.021582, + "nauc_mrr_at_5_diff1": 0.486, + "nauc_mrr_at_10_max": 0.370587, + "nauc_mrr_at_10_std": 0.022374, + "nauc_mrr_at_10_diff1": 0.486502, + "nauc_mrr_at_20_max": 0.370464, + "nauc_mrr_at_20_std": 0.02321, + "nauc_mrr_at_20_diff1": 0.484714, + "nauc_mrr_at_100_max": 0.37177, + "nauc_mrr_at_100_std": 0.024504, + "nauc_mrr_at_100_diff1": 0.485737, + "nauc_mrr_at_1000_max": 0.371827, + "nauc_mrr_at_1000_std": 0.024254, + "nauc_mrr_at_1000_diff1": 0.485721, + "main_score": 0.4921, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 5.869836091995239, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackProgrammersRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackProgrammersRetrieval.json new file mode 100644 index 0000000000..e3ef321aa9 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackProgrammersRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "6184bc1440d2dbc7612be22b50686b8826d22b32", + "task_name": "CQADupstackProgrammersRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.34475, + "ndcg_at_3": 0.3856, + "ndcg_at_5": 0.4148, + "ndcg_at_10": 0.44073, + "ndcg_at_20": 0.4666, + "ndcg_at_100": 0.50111, + "ndcg_at_1000": 0.51988, + "map_at_1": 0.27333, + "map_at_3": 0.34464, + "map_at_5": 0.36672, + "map_at_10": 0.37956, + "map_at_20": 0.3884, + "map_at_100": 0.3945, + "map_at_1000": 0.39548, + "recall_at_1": 0.27333, + "recall_at_3": 0.41267, + "recall_at_5": 0.48823, + "recall_at_10": 0.56693, + "recall_at_20": 0.65829, + "recall_at_100": 0.81984, + "recall_at_1000": 0.94469, + "precision_at_1": 0.34475, + "precision_at_3": 0.18493, + "precision_at_5": 0.13516, + "precision_at_10": 0.08105, + "precision_at_20": 0.04886, + "precision_at_100": 0.013, + "precision_at_1000": 0.00161, + "mrr_at_1": 0.344749, + "mrr_at_3": 0.408676, + "mrr_at_5": 0.426027, + "mrr_at_10": 0.436841, + "mrr_at_20": 0.442728, + "mrr_at_100": 0.446494, + "mrr_at_1000": 0.446926, + "nauc_ndcg_at_1_max": 0.397641, + "nauc_ndcg_at_1_std": 0.039251, + "nauc_ndcg_at_1_diff1": 0.445659, + "nauc_ndcg_at_3_max": 0.382589, + "nauc_ndcg_at_3_std": 0.018499, + "nauc_ndcg_at_3_diff1": 0.369831, + "nauc_ndcg_at_5_max": 0.387342, + "nauc_ndcg_at_5_std": 0.039866, + "nauc_ndcg_at_5_diff1": 0.373769, + "nauc_ndcg_at_10_max": 0.386575, + "nauc_ndcg_at_10_std": 0.058274, + "nauc_ndcg_at_10_diff1": 0.370426, + "nauc_ndcg_at_20_max": 0.395146, + "nauc_ndcg_at_20_std": 0.065832, + "nauc_ndcg_at_20_diff1": 0.382554, + "nauc_ndcg_at_100_max": 0.403547, + "nauc_ndcg_at_100_std": 0.085445, + "nauc_ndcg_at_100_diff1": 0.391128, + "nauc_ndcg_at_1000_max": 0.40077, + "nauc_ndcg_at_1000_std": 0.07439, + "nauc_ndcg_at_1000_diff1": 0.390814, + "nauc_map_at_1_max": 0.350632, + "nauc_map_at_1_std": -0.005404, + "nauc_map_at_1_diff1": 0.451445, + "nauc_map_at_3_max": 0.369092, + "nauc_map_at_3_std": 0.004003, + "nauc_map_at_3_diff1": 0.392619, + "nauc_map_at_5_max": 0.378522, + "nauc_map_at_5_std": 0.02141, + "nauc_map_at_5_diff1": 0.392841, + "nauc_map_at_10_max": 0.378978, + "nauc_map_at_10_std": 0.030881, + "nauc_map_at_10_diff1": 0.389168, + "nauc_map_at_20_max": 0.383397, + "nauc_map_at_20_std": 0.033992, + "nauc_map_at_20_diff1": 0.393318, + "nauc_map_at_100_max": 0.385488, + "nauc_map_at_100_std": 0.037565, + "nauc_map_at_100_diff1": 0.395518, + "nauc_map_at_1000_max": 0.385387, + "nauc_map_at_1000_std": 0.037427, + "nauc_map_at_1000_diff1": 0.395469, + "nauc_recall_at_1_max": 0.350632, + "nauc_recall_at_1_std": -0.005404, + "nauc_recall_at_1_diff1": 0.451445, + "nauc_recall_at_3_max": 0.356361, + "nauc_recall_at_3_std": 0.013345, + "nauc_recall_at_3_diff1": 0.324132, + "nauc_recall_at_5_max": 0.363771, + "nauc_recall_at_5_std": 0.060518, + "nauc_recall_at_5_diff1": 0.316107, + "nauc_recall_at_10_max": 0.35361, + "nauc_recall_at_10_std": 0.115485, + "nauc_recall_at_10_diff1": 0.293829, + "nauc_recall_at_20_max": 0.372771, + "nauc_recall_at_20_std": 0.153363, + "nauc_recall_at_20_diff1": 0.324125, + "nauc_recall_at_100_max": 0.422918, + "nauc_recall_at_100_std": 0.374391, + "nauc_recall_at_100_diff1": 0.354287, + "nauc_recall_at_1000_max": 0.415002, + "nauc_recall_at_1000_std": 0.508242, + "nauc_recall_at_1000_diff1": 0.367822, + "nauc_precision_at_1_max": 0.397641, + "nauc_precision_at_1_std": 0.039251, + "nauc_precision_at_1_diff1": 0.445659, + "nauc_precision_at_3_max": 0.366452, + "nauc_precision_at_3_std": 0.072522, + "nauc_precision_at_3_diff1": 0.220843, + "nauc_precision_at_5_max": 0.345655, + "nauc_precision_at_5_std": 0.119149, + "nauc_precision_at_5_diff1": 0.190929, + "nauc_precision_at_10_max": 0.298519, + "nauc_precision_at_10_std": 0.159767, + "nauc_precision_at_10_diff1": 0.129888, + "nauc_precision_at_20_max": 0.256837, + "nauc_precision_at_20_std": 0.157964, + "nauc_precision_at_20_diff1": 0.110048, + "nauc_precision_at_100_max": 0.137123, + "nauc_precision_at_100_std": 0.156712, + "nauc_precision_at_100_diff1": 0.0139, + "nauc_precision_at_1000_max": -0.018798, + "nauc_precision_at_1000_std": 0.062593, + "nauc_precision_at_1000_diff1": -0.102659, + "nauc_mrr_at_1_max": 0.397641, + "nauc_mrr_at_1_std": 0.039251, + "nauc_mrr_at_1_diff1": 0.445659, + "nauc_mrr_at_3_max": 0.407853, + "nauc_mrr_at_3_std": 0.040804, + "nauc_mrr_at_3_diff1": 0.393704, + "nauc_mrr_at_5_max": 0.407073, + "nauc_mrr_at_5_std": 0.050216, + "nauc_mrr_at_5_diff1": 0.393753, + "nauc_mrr_at_10_max": 0.405894, + "nauc_mrr_at_10_std": 0.055276, + "nauc_mrr_at_10_diff1": 0.392104, + "nauc_mrr_at_20_max": 0.406578, + "nauc_mrr_at_20_std": 0.055479, + "nauc_mrr_at_20_diff1": 0.394091, + "nauc_mrr_at_100_max": 0.406906, + "nauc_mrr_at_100_std": 0.057411, + "nauc_mrr_at_100_diff1": 0.394849, + "nauc_mrr_at_1000_max": 0.406911, + "nauc_mrr_at_1000_std": 0.057124, + "nauc_mrr_at_1000_diff1": 0.395046, + "main_score": 0.44073, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 4.882723808288574, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackStatsRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackStatsRetrieval.json new file mode 100644 index 0000000000..fb9b756539 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackStatsRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "65ac3a16b8e91f9cee4c9828cc7c335575432a2a", + "task_name": "CQADupstackStatsRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.27761, + "ndcg_at_3": 0.32663, + "ndcg_at_5": 0.34131, + "ndcg_at_10": 0.36504, + "ndcg_at_20": 0.38291, + "ndcg_at_100": 0.41237, + "ndcg_at_1000": 0.43876, + "map_at_1": 0.2505, + "map_at_3": 0.30271, + "map_at_5": 0.31164, + "map_at_10": 0.32226, + "map_at_20": 0.32744, + "map_at_100": 0.3316, + "map_at_1000": 0.33271, + "recall_at_1": 0.2505, + "recall_at_3": 0.36206, + "recall_at_5": 0.39948, + "recall_at_10": 0.46991, + "recall_at_20": 0.53624, + "recall_at_100": 0.68629, + "recall_at_1000": 0.87889, + "precision_at_1": 0.27761, + "precision_at_3": 0.14059, + "precision_at_5": 0.09417, + "precision_at_10": 0.05675, + "precision_at_20": 0.03305, + "precision_at_100": 0.00879, + "precision_at_1000": 0.00118, + "mrr_at_1": 0.277607, + "mrr_at_3": 0.329499, + "mrr_at_5": 0.339468, + "mrr_at_10": 0.349337, + "mrr_at_20": 0.353905, + "mrr_at_100": 0.357466, + "mrr_at_1000": 0.358224, + "nauc_ndcg_at_1_max": 0.448411, + "nauc_ndcg_at_1_std": -0.013126, + "nauc_ndcg_at_1_diff1": 0.597178, + "nauc_ndcg_at_3_max": 0.427975, + "nauc_ndcg_at_3_std": 0.024626, + "nauc_ndcg_at_3_diff1": 0.518556, + "nauc_ndcg_at_5_max": 0.416214, + "nauc_ndcg_at_5_std": 0.01684, + "nauc_ndcg_at_5_diff1": 0.508028, + "nauc_ndcg_at_10_max": 0.42287, + "nauc_ndcg_at_10_std": 0.030475, + "nauc_ndcg_at_10_diff1": 0.498489, + "nauc_ndcg_at_20_max": 0.418893, + "nauc_ndcg_at_20_std": 0.037909, + "nauc_ndcg_at_20_diff1": 0.492478, + "nauc_ndcg_at_100_max": 0.427082, + "nauc_ndcg_at_100_std": 0.05407, + "nauc_ndcg_at_100_diff1": 0.488937, + "nauc_ndcg_at_1000_max": 0.432609, + "nauc_ndcg_at_1000_std": 0.060383, + "nauc_ndcg_at_1000_diff1": 0.493733, + "nauc_map_at_1_max": 0.413501, + "nauc_map_at_1_std": -0.031212, + "nauc_map_at_1_diff1": 0.581888, + "nauc_map_at_3_max": 0.420579, + "nauc_map_at_3_std": 0.009495, + "nauc_map_at_3_diff1": 0.532353, + "nauc_map_at_5_max": 0.416532, + "nauc_map_at_5_std": 0.007827, + "nauc_map_at_5_diff1": 0.526819, + "nauc_map_at_10_max": 0.422262, + "nauc_map_at_10_std": 0.015379, + "nauc_map_at_10_diff1": 0.523528, + "nauc_map_at_20_max": 0.421341, + "nauc_map_at_20_std": 0.017841, + "nauc_map_at_20_diff1": 0.521953, + "nauc_map_at_100_max": 0.422941, + "nauc_map_at_100_std": 0.020426, + "nauc_map_at_100_diff1": 0.521613, + "nauc_map_at_1000_max": 0.423149, + "nauc_map_at_1000_std": 0.020652, + "nauc_map_at_1000_diff1": 0.521779, + "nauc_recall_at_1_max": 0.413501, + "nauc_recall_at_1_std": -0.031212, + "nauc_recall_at_1_diff1": 0.581888, + "nauc_recall_at_3_max": 0.405939, + "nauc_recall_at_3_std": 0.040949, + "nauc_recall_at_3_diff1": 0.462376, + "nauc_recall_at_5_max": 0.381247, + "nauc_recall_at_5_std": 0.02567, + "nauc_recall_at_5_diff1": 0.435367, + "nauc_recall_at_10_max": 0.394714, + "nauc_recall_at_10_std": 0.065503, + "nauc_recall_at_10_diff1": 0.406372, + "nauc_recall_at_20_max": 0.370246, + "nauc_recall_at_20_std": 0.089839, + "nauc_recall_at_20_diff1": 0.372781, + "nauc_recall_at_100_max": 0.395534, + "nauc_recall_at_100_std": 0.195651, + "nauc_recall_at_100_diff1": 0.313649, + "nauc_recall_at_1000_max": 0.480669, + "nauc_recall_at_1000_std": 0.481718, + "nauc_recall_at_1000_diff1": 0.228327, + "nauc_precision_at_1_max": 0.448411, + "nauc_precision_at_1_std": -0.013126, + "nauc_precision_at_1_diff1": 0.597178, + "nauc_precision_at_3_max": 0.438281, + "nauc_precision_at_3_std": 0.096133, + "nauc_precision_at_3_diff1": 0.44557, + "nauc_precision_at_5_max": 0.417458, + "nauc_precision_at_5_std": 0.097188, + "nauc_precision_at_5_diff1": 0.417407, + "nauc_precision_at_10_max": 0.419365, + "nauc_precision_at_10_std": 0.141248, + "nauc_precision_at_10_diff1": 0.354298, + "nauc_precision_at_20_max": 0.363151, + "nauc_precision_at_20_std": 0.167029, + "nauc_precision_at_20_diff1": 0.286847, + "nauc_precision_at_100_max": 0.313428, + "nauc_precision_at_100_std": 0.208383, + "nauc_precision_at_100_diff1": 0.174274, + "nauc_precision_at_1000_max": 0.167689, + "nauc_precision_at_1000_std": 0.190164, + "nauc_precision_at_1000_diff1": 0.022743, + "nauc_mrr_at_1_max": 0.448411, + "nauc_mrr_at_1_std": -0.013126, + "nauc_mrr_at_1_diff1": 0.597178, + "nauc_mrr_at_3_max": 0.443157, + "nauc_mrr_at_3_std": 0.018439, + "nauc_mrr_at_3_diff1": 0.540921, + "nauc_mrr_at_5_max": 0.437186, + "nauc_mrr_at_5_std": 0.015712, + "nauc_mrr_at_5_diff1": 0.534764, + "nauc_mrr_at_10_max": 0.438221, + "nauc_mrr_at_10_std": 0.018455, + "nauc_mrr_at_10_diff1": 0.53019, + "nauc_mrr_at_20_max": 0.437876, + "nauc_mrr_at_20_std": 0.020614, + "nauc_mrr_at_20_diff1": 0.529212, + "nauc_mrr_at_100_max": 0.438686, + "nauc_mrr_at_100_std": 0.022636, + "nauc_mrr_at_100_diff1": 0.52908, + "nauc_mrr_at_1000_max": 0.438977, + "nauc_mrr_at_1000_std": 0.0228, + "nauc_mrr_at_1000_diff1": 0.529321, + "main_score": 0.36504, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 5.857112646102905, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackTexRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackTexRetrieval.json new file mode 100644 index 0000000000..896fb0c241 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackTexRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "46989137a86843e03a6195de44b09deda022eec7", + "task_name": "CQADupstackTexRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.22608, + "ndcg_at_3": 0.27421, + "ndcg_at_5": 0.29387, + "ndcg_at_10": 0.31763, + "ndcg_at_20": 0.3383, + "ndcg_at_100": 0.37148, + "ndcg_at_1000": 0.40154, + "map_at_1": 0.18563, + "map_at_3": 0.24249, + "map_at_5": 0.2561, + "map_at_10": 0.26736, + "map_at_20": 0.27379, + "map_at_100": 0.27907, + "map_at_1000": 0.28041, + "recall_at_1": 0.18563, + "recall_at_3": 0.3052, + "recall_at_5": 0.35699, + "recall_at_10": 0.42763, + "recall_at_20": 0.50414, + "recall_at_100": 0.66696, + "recall_at_1000": 0.87935, + "precision_at_1": 0.22608, + "precision_at_3": 0.13203, + "precision_at_5": 0.09484, + "precision_at_10": 0.05867, + "precision_at_20": 0.03541, + "precision_at_100": 0.01003, + "precision_at_1000": 0.00144, + "mrr_at_1": 0.226084, + "mrr_at_3": 0.284641, + "mrr_at_5": 0.297769, + "mrr_at_10": 0.307698, + "mrr_at_20": 0.313134, + "mrr_at_100": 0.31715, + "mrr_at_1000": 0.317937, + "nauc_ndcg_at_1_max": 0.311265, + "nauc_ndcg_at_1_std": -0.029793, + "nauc_ndcg_at_1_diff1": 0.382216, + "nauc_ndcg_at_3_max": 0.305509, + "nauc_ndcg_at_3_std": -0.012316, + "nauc_ndcg_at_3_diff1": 0.323998, + "nauc_ndcg_at_5_max": 0.308415, + "nauc_ndcg_at_5_std": -0.003068, + "nauc_ndcg_at_5_diff1": 0.314397, + "nauc_ndcg_at_10_max": 0.308415, + "nauc_ndcg_at_10_std": 0.007106, + "nauc_ndcg_at_10_diff1": 0.308222, + "nauc_ndcg_at_20_max": 0.310932, + "nauc_ndcg_at_20_std": 0.015157, + "nauc_ndcg_at_20_diff1": 0.309304, + "nauc_ndcg_at_100_max": 0.314027, + "nauc_ndcg_at_100_std": 0.030986, + "nauc_ndcg_at_100_diff1": 0.307135, + "nauc_ndcg_at_1000_max": 0.315806, + "nauc_ndcg_at_1000_std": 0.031075, + "nauc_ndcg_at_1000_diff1": 0.310606, + "nauc_map_at_1_max": 0.291041, + "nauc_map_at_1_std": -0.029926, + "nauc_map_at_1_diff1": 0.381991, + "nauc_map_at_3_max": 0.298633, + "nauc_map_at_3_std": -0.017084, + "nauc_map_at_3_diff1": 0.338144, + "nauc_map_at_5_max": 0.302278, + "nauc_map_at_5_std": -0.012788, + "nauc_map_at_5_diff1": 0.331826, + "nauc_map_at_10_max": 0.302663, + "nauc_map_at_10_std": -0.008608, + "nauc_map_at_10_diff1": 0.328626, + "nauc_map_at_20_max": 0.304087, + "nauc_map_at_20_std": -0.006128, + "nauc_map_at_20_diff1": 0.329021, + "nauc_map_at_100_max": 0.305057, + "nauc_map_at_100_std": -0.003387, + "nauc_map_at_100_diff1": 0.328962, + "nauc_map_at_1000_max": 0.305426, + "nauc_map_at_1000_std": -0.003169, + "nauc_map_at_1000_diff1": 0.329248, + "nauc_recall_at_1_max": 0.291041, + "nauc_recall_at_1_std": -0.029926, + "nauc_recall_at_1_diff1": 0.381991, + "nauc_recall_at_3_max": 0.287102, + "nauc_recall_at_3_std": 0.000768, + "nauc_recall_at_3_diff1": 0.280408, + "nauc_recall_at_5_max": 0.294123, + "nauc_recall_at_5_std": 0.019143, + "nauc_recall_at_5_diff1": 0.257284, + "nauc_recall_at_10_max": 0.290965, + "nauc_recall_at_10_std": 0.043028, + "nauc_recall_at_10_diff1": 0.236586, + "nauc_recall_at_20_max": 0.292611, + "nauc_recall_at_20_std": 0.072578, + "nauc_recall_at_20_diff1": 0.234031, + "nauc_recall_at_100_max": 0.301256, + "nauc_recall_at_100_std": 0.169465, + "nauc_recall_at_100_diff1": 0.205552, + "nauc_recall_at_1000_max": 0.3214, + "nauc_recall_at_1000_std": 0.326304, + "nauc_recall_at_1000_diff1": 0.150418, + "nauc_precision_at_1_max": 0.311265, + "nauc_precision_at_1_std": -0.029793, + "nauc_precision_at_1_diff1": 0.382216, + "nauc_precision_at_3_max": 0.31099, + "nauc_precision_at_3_std": -0.002732, + "nauc_precision_at_3_diff1": 0.269625, + "nauc_precision_at_5_max": 0.307033, + "nauc_precision_at_5_std": 0.013936, + "nauc_precision_at_5_diff1": 0.239477, + "nauc_precision_at_10_max": 0.291896, + "nauc_precision_at_10_std": 0.042897, + "nauc_precision_at_10_diff1": 0.212624, + "nauc_precision_at_20_max": 0.274845, + "nauc_precision_at_20_std": 0.060583, + "nauc_precision_at_20_diff1": 0.196898, + "nauc_precision_at_100_max": 0.235437, + "nauc_precision_at_100_std": 0.094634, + "nauc_precision_at_100_diff1": 0.143262, + "nauc_precision_at_1000_max": 0.175069, + "nauc_precision_at_1000_std": 0.057981, + "nauc_precision_at_1000_diff1": 0.092406, + "nauc_mrr_at_1_max": 0.311265, + "nauc_mrr_at_1_std": -0.029793, + "nauc_mrr_at_1_diff1": 0.382216, + "nauc_mrr_at_3_max": 0.312049, + "nauc_mrr_at_3_std": -0.012617, + "nauc_mrr_at_3_diff1": 0.333542, + "nauc_mrr_at_5_max": 0.314353, + "nauc_mrr_at_5_std": -0.007121, + "nauc_mrr_at_5_diff1": 0.327824, + "nauc_mrr_at_10_max": 0.314417, + "nauc_mrr_at_10_std": -0.002959, + "nauc_mrr_at_10_diff1": 0.326206, + "nauc_mrr_at_20_max": 0.315223, + "nauc_mrr_at_20_std": -0.001169, + "nauc_mrr_at_20_diff1": 0.327288, + "nauc_mrr_at_100_max": 0.315359, + "nauc_mrr_at_100_std": 5e-06, + "nauc_mrr_at_100_diff1": 0.326989, + "nauc_mrr_at_1000_max": 0.315396, + "nauc_mrr_at_1000_std": 0.000121, + "nauc_mrr_at_1000_diff1": 0.327033, + "main_score": 0.31763, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 17.137136697769165, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackUnixRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackUnixRetrieval.json new file mode 100644 index 0000000000..c416182795 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackUnixRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "6c6430d3a6d36f8d2a829195bc5dc94d7e063e53", + "task_name": "CQADupstackUnixRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.33769, + "ndcg_at_3": 0.38203, + "ndcg_at_5": 0.40706, + "ndcg_at_10": 0.43429, + "ndcg_at_20": 0.45367, + "ndcg_at_100": 0.48494, + "ndcg_at_1000": 0.50737, + "map_at_1": 0.28119, + "map_at_3": 0.34614, + "map_at_5": 0.36319, + "map_at_10": 0.37609, + "map_at_20": 0.38242, + "map_at_100": 0.38742, + "map_at_1000": 0.38842, + "recall_at_1": 0.28119, + "recall_at_3": 0.41638, + "recall_at_5": 0.48319, + "recall_at_10": 0.56333, + "recall_at_20": 0.63211, + "recall_at_100": 0.78339, + "recall_at_1000": 0.93921, + "precision_at_1": 0.33769, + "precision_at_3": 0.176, + "precision_at_5": 0.12351, + "precision_at_10": 0.07388, + "precision_at_20": 0.04244, + "precision_at_100": 0.01112, + "precision_at_1000": 0.00141, + "mrr_at_1": 0.337687, + "mrr_at_3": 0.399254, + "mrr_at_5": 0.414739, + "mrr_at_10": 0.425785, + "mrr_at_20": 0.430479, + "mrr_at_100": 0.433771, + "mrr_at_1000": 0.434306, + "nauc_ndcg_at_1_max": 0.424149, + "nauc_ndcg_at_1_std": -0.070256, + "nauc_ndcg_at_1_diff1": 0.512801, + "nauc_ndcg_at_3_max": 0.411203, + "nauc_ndcg_at_3_std": -0.049973, + "nauc_ndcg_at_3_diff1": 0.469277, + "nauc_ndcg_at_5_max": 0.408392, + "nauc_ndcg_at_5_std": -0.03928, + "nauc_ndcg_at_5_diff1": 0.45576, + "nauc_ndcg_at_10_max": 0.411119, + "nauc_ndcg_at_10_std": -0.027399, + "nauc_ndcg_at_10_diff1": 0.440864, + "nauc_ndcg_at_20_max": 0.413441, + "nauc_ndcg_at_20_std": -0.021734, + "nauc_ndcg_at_20_diff1": 0.436225, + "nauc_ndcg_at_100_max": 0.419831, + "nauc_ndcg_at_100_std": -0.007288, + "nauc_ndcg_at_100_diff1": 0.441649, + "nauc_ndcg_at_1000_max": 0.416516, + "nauc_ndcg_at_1000_std": -0.014408, + "nauc_ndcg_at_1000_diff1": 0.44195, + "nauc_map_at_1_max": 0.396387, + "nauc_map_at_1_std": -0.075039, + "nauc_map_at_1_diff1": 0.51609, + "nauc_map_at_3_max": 0.40686, + "nauc_map_at_3_std": -0.059326, + "nauc_map_at_3_diff1": 0.485255, + "nauc_map_at_5_max": 0.40673, + "nauc_map_at_5_std": -0.052185, + "nauc_map_at_5_diff1": 0.476163, + "nauc_map_at_10_max": 0.408586, + "nauc_map_at_10_std": -0.048073, + "nauc_map_at_10_diff1": 0.468441, + "nauc_map_at_20_max": 0.409567, + "nauc_map_at_20_std": -0.046605, + "nauc_map_at_20_diff1": 0.467016, + "nauc_map_at_100_max": 0.411125, + "nauc_map_at_100_std": -0.044396, + "nauc_map_at_100_diff1": 0.46814, + "nauc_map_at_1000_max": 0.41089, + "nauc_map_at_1000_std": -0.044487, + "nauc_map_at_1000_diff1": 0.468063, + "nauc_recall_at_1_max": 0.396387, + "nauc_recall_at_1_std": -0.075039, + "nauc_recall_at_1_diff1": 0.51609, + "nauc_recall_at_3_max": 0.389404, + "nauc_recall_at_3_std": -0.035958, + "nauc_recall_at_3_diff1": 0.42968, + "nauc_recall_at_5_max": 0.377554, + "nauc_recall_at_5_std": -0.008589, + "nauc_recall_at_5_diff1": 0.387092, + "nauc_recall_at_10_max": 0.372372, + "nauc_recall_at_10_std": 0.026717, + "nauc_recall_at_10_diff1": 0.332167, + "nauc_recall_at_20_max": 0.379233, + "nauc_recall_at_20_std": 0.056414, + "nauc_recall_at_20_diff1": 0.306136, + "nauc_recall_at_100_max": 0.414187, + "nauc_recall_at_100_std": 0.204227, + "nauc_recall_at_100_diff1": 0.298569, + "nauc_recall_at_1000_max": 0.42028, + "nauc_recall_at_1000_std": 0.403871, + "nauc_recall_at_1000_diff1": 0.09736, + "nauc_precision_at_1_max": 0.424149, + "nauc_precision_at_1_std": -0.070256, + "nauc_precision_at_1_diff1": 0.512801, + "nauc_precision_at_3_max": 0.384404, + "nauc_precision_at_3_std": -0.020049, + "nauc_precision_at_3_diff1": 0.366288, + "nauc_precision_at_5_max": 0.365007, + "nauc_precision_at_5_std": 0.007462, + "nauc_precision_at_5_diff1": 0.297504, + "nauc_precision_at_10_max": 0.326678, + "nauc_precision_at_10_std": 0.041079, + "nauc_precision_at_10_diff1": 0.198414, + "nauc_precision_at_20_max": 0.282677, + "nauc_precision_at_20_std": 0.058223, + "nauc_precision_at_20_diff1": 0.12979, + "nauc_precision_at_100_max": 0.183563, + "nauc_precision_at_100_std": 0.119778, + "nauc_precision_at_100_diff1": 0.017943, + "nauc_precision_at_1000_max": -0.001347, + "nauc_precision_at_1000_std": 0.056899, + "nauc_precision_at_1000_diff1": -0.11767, + "nauc_mrr_at_1_max": 0.424149, + "nauc_mrr_at_1_std": -0.070256, + "nauc_mrr_at_1_diff1": 0.512801, + "nauc_mrr_at_3_max": 0.423153, + "nauc_mrr_at_3_std": -0.045603, + "nauc_mrr_at_3_diff1": 0.475093, + "nauc_mrr_at_5_max": 0.421232, + "nauc_mrr_at_5_std": -0.040598, + "nauc_mrr_at_5_diff1": 0.465463, + "nauc_mrr_at_10_max": 0.421948, + "nauc_mrr_at_10_std": -0.035751, + "nauc_mrr_at_10_diff1": 0.461084, + "nauc_mrr_at_20_max": 0.421855, + "nauc_mrr_at_20_std": -0.035484, + "nauc_mrr_at_20_diff1": 0.460581, + "nauc_mrr_at_100_max": 0.422198, + "nauc_mrr_at_100_std": -0.035402, + "nauc_mrr_at_100_diff1": 0.461798, + "nauc_mrr_at_1000_max": 0.422129, + "nauc_mrr_at_1000_std": -0.035552, + "nauc_mrr_at_1000_diff1": 0.461874, + "main_score": 0.43429, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 7.251422882080078, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackWebmastersRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackWebmastersRetrieval.json new file mode 100644 index 0000000000..f8e64671f4 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackWebmastersRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "160c094312a0e1facb97e55eeddb698c0abe3571", + "task_name": "CQADupstackWebmastersRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.31818, + "ndcg_at_3": 0.37099, + "ndcg_at_5": 0.39321, + "ndcg_at_10": 0.42168, + "ndcg_at_20": 0.44159, + "ndcg_at_100": 0.48116, + "ndcg_at_1000": 0.50288, + "map_at_1": 0.26726, + "map_at_3": 0.33054, + "map_at_5": 0.34713, + "map_at_10": 0.36201, + "map_at_20": 0.36956, + "map_at_100": 0.37793, + "map_at_1000": 0.38005, + "recall_at_1": 0.26726, + "recall_at_3": 0.39235, + "recall_at_5": 0.45002, + "recall_at_10": 0.53583, + "recall_at_20": 0.61293, + "recall_at_100": 0.80601, + "recall_at_1000": 0.93931, + "precision_at_1": 0.31818, + "precision_at_3": 0.17325, + "precision_at_5": 0.12648, + "precision_at_10": 0.08162, + "precision_at_20": 0.05069, + "precision_at_100": 0.01595, + "precision_at_1000": 0.00243, + "mrr_at_1": 0.318182, + "mrr_at_3": 0.380105, + "mrr_at_5": 0.393841, + "mrr_at_10": 0.406055, + "mrr_at_20": 0.411634, + "mrr_at_100": 0.415792, + "mrr_at_1000": 0.416241, + "nauc_ndcg_at_1_max": 0.417493, + "nauc_ndcg_at_1_std": 0.028012, + "nauc_ndcg_at_1_diff1": 0.515883, + "nauc_ndcg_at_3_max": 0.39641, + "nauc_ndcg_at_3_std": 0.034673, + "nauc_ndcg_at_3_diff1": 0.483177, + "nauc_ndcg_at_5_max": 0.397146, + "nauc_ndcg_at_5_std": 0.061038, + "nauc_ndcg_at_5_diff1": 0.467181, + "nauc_ndcg_at_10_max": 0.399632, + "nauc_ndcg_at_10_std": 0.067557, + "nauc_ndcg_at_10_diff1": 0.469198, + "nauc_ndcg_at_20_max": 0.408675, + "nauc_ndcg_at_20_std": 0.07474, + "nauc_ndcg_at_20_diff1": 0.481862, + "nauc_ndcg_at_100_max": 0.41571, + "nauc_ndcg_at_100_std": 0.094749, + "nauc_ndcg_at_100_diff1": 0.471658, + "nauc_ndcg_at_1000_max": 0.414311, + "nauc_ndcg_at_1000_std": 0.083462, + "nauc_ndcg_at_1000_diff1": 0.477974, + "nauc_map_at_1_max": 0.402571, + "nauc_map_at_1_std": -0.024844, + "nauc_map_at_1_diff1": 0.551626, + "nauc_map_at_3_max": 0.397674, + "nauc_map_at_3_std": 0.006103, + "nauc_map_at_3_diff1": 0.507803, + "nauc_map_at_5_max": 0.403465, + "nauc_map_at_5_std": 0.018712, + "nauc_map_at_5_diff1": 0.498383, + "nauc_map_at_10_max": 0.406434, + "nauc_map_at_10_std": 0.028061, + "nauc_map_at_10_diff1": 0.496507, + "nauc_map_at_20_max": 0.408435, + "nauc_map_at_20_std": 0.036694, + "nauc_map_at_20_diff1": 0.49803, + "nauc_map_at_100_max": 0.409898, + "nauc_map_at_100_std": 0.045306, + "nauc_map_at_100_diff1": 0.49541, + "nauc_map_at_1000_max": 0.408244, + "nauc_map_at_1000_std": 0.045699, + "nauc_map_at_1000_diff1": 0.494811, + "nauc_recall_at_1_max": 0.402571, + "nauc_recall_at_1_std": -0.024844, + "nauc_recall_at_1_diff1": 0.551626, + "nauc_recall_at_3_max": 0.36185, + "nauc_recall_at_3_std": 0.026374, + "nauc_recall_at_3_diff1": 0.458239, + "nauc_recall_at_5_max": 0.363405, + "nauc_recall_at_5_std": 0.07565, + "nauc_recall_at_5_diff1": 0.411704, + "nauc_recall_at_10_max": 0.369469, + "nauc_recall_at_10_std": 0.106272, + "nauc_recall_at_10_diff1": 0.406365, + "nauc_recall_at_20_max": 0.397016, + "nauc_recall_at_20_std": 0.151894, + "nauc_recall_at_20_diff1": 0.435917, + "nauc_recall_at_100_max": 0.399484, + "nauc_recall_at_100_std": 0.343379, + "nauc_recall_at_100_diff1": 0.316471, + "nauc_recall_at_1000_max": 0.433592, + "nauc_recall_at_1000_std": 0.475785, + "nauc_recall_at_1000_diff1": 0.354811, + "nauc_precision_at_1_max": 0.417493, + "nauc_precision_at_1_std": 0.028012, + "nauc_precision_at_1_diff1": 0.515883, + "nauc_precision_at_3_max": 0.346644, + "nauc_precision_at_3_std": 0.096084, + "nauc_precision_at_3_diff1": 0.331713, + "nauc_precision_at_5_max": 0.32019, + "nauc_precision_at_5_std": 0.178246, + "nauc_precision_at_5_diff1": 0.232968, + "nauc_precision_at_10_max": 0.244467, + "nauc_precision_at_10_std": 0.228442, + "nauc_precision_at_10_diff1": 0.146283, + "nauc_precision_at_20_max": 0.188701, + "nauc_precision_at_20_std": 0.269559, + "nauc_precision_at_20_diff1": 0.106306, + "nauc_precision_at_100_max": 0.028291, + "nauc_precision_at_100_std": 0.240751, + "nauc_precision_at_100_diff1": -0.051774, + "nauc_precision_at_1000_max": -0.130913, + "nauc_precision_at_1000_std": 0.122742, + "nauc_precision_at_1000_diff1": -0.128025, + "nauc_mrr_at_1_max": 0.417493, + "nauc_mrr_at_1_std": 0.028012, + "nauc_mrr_at_1_diff1": 0.515883, + "nauc_mrr_at_3_max": 0.404462, + "nauc_mrr_at_3_std": 0.047816, + "nauc_mrr_at_3_diff1": 0.482216, + "nauc_mrr_at_5_max": 0.4038, + "nauc_mrr_at_5_std": 0.06252, + "nauc_mrr_at_5_diff1": 0.471366, + "nauc_mrr_at_10_max": 0.404138, + "nauc_mrr_at_10_std": 0.063527, + "nauc_mrr_at_10_diff1": 0.473502, + "nauc_mrr_at_20_max": 0.408084, + "nauc_mrr_at_20_std": 0.063661, + "nauc_mrr_at_20_diff1": 0.477426, + "nauc_mrr_at_100_max": 0.407527, + "nauc_mrr_at_100_std": 0.064731, + "nauc_mrr_at_100_diff1": 0.476211, + "nauc_mrr_at_1000_max": 0.407528, + "nauc_mrr_at_1000_std": 0.0645, + "nauc_mrr_at_1000_diff1": 0.476405, + "main_score": 0.42168, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 2.6610183715820312, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackWordpressRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackWordpressRetrieval.json new file mode 100644 index 0000000000..1c763e7127 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CQADupstackWordpressRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "4ffe81d471b1924886b33c7567bfb200e9eec5c4", + "task_name": "CQADupstackWordpressRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.2403, + "ndcg_at_3": 0.30433, + "ndcg_at_5": 0.32707, + "ndcg_at_10": 0.35556, + "ndcg_at_20": 0.3763, + "ndcg_at_100": 0.40363, + "ndcg_at_1000": 0.43005, + "map_at_1": 0.22033, + "map_at_3": 0.27903, + "map_at_5": 0.29288, + "map_at_10": 0.30542, + "map_at_20": 0.31137, + "map_at_100": 0.31523, + "map_at_1000": 0.3163, + "recall_at_1": 0.22033, + "recall_at_3": 0.35086, + "recall_at_5": 0.40514, + "recall_at_10": 0.48866, + "recall_at_20": 0.56919, + "recall_at_100": 0.71052, + "recall_at_1000": 0.90599, + "precision_at_1": 0.2403, + "precision_at_3": 0.13247, + "precision_at_5": 0.09353, + "precision_at_10": 0.05804, + "precision_at_20": 0.03346, + "precision_at_100": 0.00863, + "precision_at_1000": 0.00121, + "mrr_at_1": 0.240296, + "mrr_at_3": 0.302834, + "mrr_at_5": 0.315034, + "mrr_at_10": 0.326008, + "mrr_at_20": 0.331602, + "mrr_at_100": 0.334967, + "mrr_at_1000": 0.335721, + "nauc_ndcg_at_1_max": 0.33044, + "nauc_ndcg_at_1_std": 0.005843, + "nauc_ndcg_at_1_diff1": 0.450283, + "nauc_ndcg_at_3_max": 0.304702, + "nauc_ndcg_at_3_std": -0.014414, + "nauc_ndcg_at_3_diff1": 0.366072, + "nauc_ndcg_at_5_max": 0.305504, + "nauc_ndcg_at_5_std": -0.012375, + "nauc_ndcg_at_5_diff1": 0.353271, + "nauc_ndcg_at_10_max": 0.309214, + "nauc_ndcg_at_10_std": 0.010496, + "nauc_ndcg_at_10_diff1": 0.333544, + "nauc_ndcg_at_20_max": 0.31355, + "nauc_ndcg_at_20_std": 0.028201, + "nauc_ndcg_at_20_diff1": 0.335217, + "nauc_ndcg_at_100_max": 0.315586, + "nauc_ndcg_at_100_std": 0.05462, + "nauc_ndcg_at_100_diff1": 0.334955, + "nauc_ndcg_at_1000_max": 0.321908, + "nauc_ndcg_at_1000_std": 0.042303, + "nauc_ndcg_at_1000_diff1": 0.34299, + "nauc_map_at_1_max": 0.298519, + "nauc_map_at_1_std": -0.018928, + "nauc_map_at_1_diff1": 0.430032, + "nauc_map_at_3_max": 0.2977, + "nauc_map_at_3_std": -0.021816, + "nauc_map_at_3_diff1": 0.372833, + "nauc_map_at_5_max": 0.301633, + "nauc_map_at_5_std": -0.019853, + "nauc_map_at_5_diff1": 0.368438, + "nauc_map_at_10_max": 0.304086, + "nauc_map_at_10_std": -0.00869, + "nauc_map_at_10_diff1": 0.360986, + "nauc_map_at_20_max": 0.305696, + "nauc_map_at_20_std": -0.002749, + "nauc_map_at_20_diff1": 0.362318, + "nauc_map_at_100_max": 0.305822, + "nauc_map_at_100_std": 0.000914, + "nauc_map_at_100_diff1": 0.361901, + "nauc_map_at_1000_max": 0.30606, + "nauc_map_at_1000_std": 0.000399, + "nauc_map_at_1000_diff1": 0.362321, + "nauc_recall_at_1_max": 0.298519, + "nauc_recall_at_1_std": -0.018928, + "nauc_recall_at_1_diff1": 0.430032, + "nauc_recall_at_3_max": 0.28352, + "nauc_recall_at_3_std": -0.023814, + "nauc_recall_at_3_diff1": 0.320485, + "nauc_recall_at_5_max": 0.283428, + "nauc_recall_at_5_std": -0.017239, + "nauc_recall_at_5_diff1": 0.29219, + "nauc_recall_at_10_max": 0.286833, + "nauc_recall_at_10_std": 0.041316, + "nauc_recall_at_10_diff1": 0.232426, + "nauc_recall_at_20_max": 0.296358, + "nauc_recall_at_20_std": 0.106617, + "nauc_recall_at_20_diff1": 0.222931, + "nauc_recall_at_100_max": 0.304869, + "nauc_recall_at_100_std": 0.298337, + "nauc_recall_at_100_diff1": 0.187547, + "nauc_recall_at_1000_max": 0.459059, + "nauc_recall_at_1000_std": 0.403117, + "nauc_recall_at_1000_diff1": 0.14964, + "nauc_precision_at_1_max": 0.33044, + "nauc_precision_at_1_std": 0.005843, + "nauc_precision_at_1_diff1": 0.450283, + "nauc_precision_at_3_max": 0.332231, + "nauc_precision_at_3_std": 0.001593, + "nauc_precision_at_3_diff1": 0.336512, + "nauc_precision_at_5_max": 0.34003, + "nauc_precision_at_5_std": 0.013139, + "nauc_precision_at_5_diff1": 0.304902, + "nauc_precision_at_10_max": 0.324304, + "nauc_precision_at_10_std": 0.088758, + "nauc_precision_at_10_diff1": 0.216993, + "nauc_precision_at_20_max": 0.343914, + "nauc_precision_at_20_std": 0.155824, + "nauc_precision_at_20_diff1": 0.21274, + "nauc_precision_at_100_max": 0.285921, + "nauc_precision_at_100_std": 0.281345, + "nauc_precision_at_100_diff1": 0.123098, + "nauc_precision_at_1000_max": 0.062756, + "nauc_precision_at_1000_std": 0.09984, + "nauc_precision_at_1000_diff1": -0.096926, + "nauc_mrr_at_1_max": 0.33044, + "nauc_mrr_at_1_std": 0.005843, + "nauc_mrr_at_1_diff1": 0.450283, + "nauc_mrr_at_3_max": 0.329489, + "nauc_mrr_at_3_std": 0.007112, + "nauc_mrr_at_3_diff1": 0.393486, + "nauc_mrr_at_5_max": 0.32727, + "nauc_mrr_at_5_std": 0.009019, + "nauc_mrr_at_5_diff1": 0.385172, + "nauc_mrr_at_10_max": 0.330199, + "nauc_mrr_at_10_std": 0.01799, + "nauc_mrr_at_10_diff1": 0.37617, + "nauc_mrr_at_20_max": 0.330626, + "nauc_mrr_at_20_std": 0.02222, + "nauc_mrr_at_20_diff1": 0.377014, + "nauc_mrr_at_100_max": 0.330107, + "nauc_mrr_at_100_std": 0.024293, + "nauc_mrr_at_100_diff1": 0.377752, + "nauc_mrr_at_1000_max": 0.330208, + "nauc_mrr_at_1000_std": 0.023889, + "nauc_mrr_at_1000_diff1": 0.37806, + "main_score": 0.35556, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 6.588428020477295, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ClimateFEVER.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ClimateFEVER.json new file mode 100644 index 0000000000..45911c0f1a --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ClimateFEVER.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "47f2ac6acb640fc46020b02a5b59fdda04d39380", + "task_name": "ClimateFEVER", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.46384, + "ndcg_at_3": 0.40277, + "ndcg_at_5": 0.41973, + "ndcg_at_10": 0.459, + "ndcg_at_20": 0.49014, + "ndcg_at_100": 0.53309, + "ndcg_at_1000": 0.55646, + "map_at_1": 0.20224, + "map_at_3": 0.30602, + "map_at_5": 0.33365, + "map_at_10": 0.35642, + "map_at_20": 0.36924, + "map_at_100": 0.37908, + "map_at_1000": 0.38065, + "recall_at_1": 0.20224, + "recall_at_3": 0.36317, + "recall_at_5": 0.42872, + "recall_at_10": 0.51494, + "recall_at_20": 0.59991, + "recall_at_100": 0.76117, + "recall_at_1000": 0.88752, + "precision_at_1": 0.46384, + "precision_at_3": 0.30662, + "precision_at_5": 0.22515, + "precision_at_10": 0.13954, + "precision_at_20": 0.08388, + "precision_at_100": 0.02205, + "precision_at_1000": 0.00265, + "mrr_at_1": 0.463844, + "mrr_at_3": 0.562975, + "mrr_at_5": 0.57721, + "mrr_at_10": 0.586005, + "mrr_at_20": 0.590034, + "mrr_at_100": 0.592011, + "mrr_at_1000": 0.592151, + "nauc_ndcg_at_1_max": 0.377028, + "nauc_ndcg_at_1_std": 0.18271, + "nauc_ndcg_at_1_diff1": 0.346525, + "nauc_ndcg_at_3_max": 0.390647, + "nauc_ndcg_at_3_std": 0.211929, + "nauc_ndcg_at_3_diff1": 0.254853, + "nauc_ndcg_at_5_max": 0.408797, + "nauc_ndcg_at_5_std": 0.229247, + "nauc_ndcg_at_5_diff1": 0.248733, + "nauc_ndcg_at_10_max": 0.438198, + "nauc_ndcg_at_10_std": 0.267543, + "nauc_ndcg_at_10_diff1": 0.240925, + "nauc_ndcg_at_20_max": 0.447398, + "nauc_ndcg_at_20_std": 0.288742, + "nauc_ndcg_at_20_diff1": 0.235086, + "nauc_ndcg_at_100_max": 0.451401, + "nauc_ndcg_at_100_std": 0.299395, + "nauc_ndcg_at_100_diff1": 0.239796, + "nauc_ndcg_at_1000_max": 0.452058, + "nauc_ndcg_at_1000_std": 0.299975, + "nauc_ndcg_at_1000_diff1": 0.242043, + "nauc_map_at_1_max": 0.313144, + "nauc_map_at_1_std": 0.048731, + "nauc_map_at_1_diff1": 0.360524, + "nauc_map_at_3_max": 0.365831, + "nauc_map_at_3_std": 0.156916, + "nauc_map_at_3_diff1": 0.271045, + "nauc_map_at_5_max": 0.388451, + "nauc_map_at_5_std": 0.193094, + "nauc_map_at_5_diff1": 0.256488, + "nauc_map_at_10_max": 0.406898, + "nauc_map_at_10_std": 0.217308, + "nauc_map_at_10_diff1": 0.250863, + "nauc_map_at_20_max": 0.412758, + "nauc_map_at_20_std": 0.228126, + "nauc_map_at_20_diff1": 0.247874, + "nauc_map_at_100_max": 0.414296, + "nauc_map_at_100_std": 0.232293, + "nauc_map_at_100_diff1": 0.248248, + "nauc_map_at_1000_max": 0.414327, + "nauc_map_at_1000_std": 0.232519, + "nauc_map_at_1000_diff1": 0.248107, + "nauc_recall_at_1_max": 0.313144, + "nauc_recall_at_1_std": 0.048731, + "nauc_recall_at_1_diff1": 0.360524, + "nauc_recall_at_3_max": 0.355722, + "nauc_recall_at_3_std": 0.176274, + "nauc_recall_at_3_diff1": 0.217028, + "nauc_recall_at_5_max": 0.381205, + "nauc_recall_at_5_std": 0.22543, + "nauc_recall_at_5_diff1": 0.184007, + "nauc_recall_at_10_max": 0.424925, + "nauc_recall_at_10_std": 0.292063, + "nauc_recall_at_10_diff1": 0.154105, + "nauc_recall_at_20_max": 0.437144, + "nauc_recall_at_20_std": 0.340744, + "nauc_recall_at_20_diff1": 0.128004, + "nauc_recall_at_100_max": 0.4509, + "nauc_recall_at_100_std": 0.396739, + "nauc_recall_at_100_diff1": 0.124778, + "nauc_recall_at_1000_max": 0.531124, + "nauc_recall_at_1000_std": 0.515624, + "nauc_recall_at_1000_diff1": 0.105779, + "nauc_precision_at_1_max": 0.377028, + "nauc_precision_at_1_std": 0.18271, + "nauc_precision_at_1_diff1": 0.346525, + "nauc_precision_at_3_max": 0.388766, + "nauc_precision_at_3_std": 0.324869, + "nauc_precision_at_3_diff1": 0.124161, + "nauc_precision_at_5_max": 0.38372, + "nauc_precision_at_5_std": 0.364059, + "nauc_precision_at_5_diff1": 0.05956, + "nauc_precision_at_10_max": 0.383169, + "nauc_precision_at_10_std": 0.407997, + "nauc_precision_at_10_diff1": 0.019062, + "nauc_precision_at_20_max": 0.337971, + "nauc_precision_at_20_std": 0.416671, + "nauc_precision_at_20_diff1": -0.028413, + "nauc_precision_at_100_max": 0.224083, + "nauc_precision_at_100_std": 0.366276, + "nauc_precision_at_100_diff1": -0.078618, + "nauc_precision_at_1000_max": 0.094634, + "nauc_precision_at_1000_std": 0.282103, + "nauc_precision_at_1000_diff1": -0.134667, + "nauc_mrr_at_1_max": 0.377028, + "nauc_mrr_at_1_std": 0.18271, + "nauc_mrr_at_1_diff1": 0.346525, + "nauc_mrr_at_3_max": 0.405693, + "nauc_mrr_at_3_std": 0.240808, + "nauc_mrr_at_3_diff1": 0.304528, + "nauc_mrr_at_5_max": 0.408848, + "nauc_mrr_at_5_std": 0.243238, + "nauc_mrr_at_5_diff1": 0.302646, + "nauc_mrr_at_10_max": 0.412905, + "nauc_mrr_at_10_std": 0.247973, + "nauc_mrr_at_10_diff1": 0.303637, + "nauc_mrr_at_20_max": 0.413406, + "nauc_mrr_at_20_std": 0.249205, + "nauc_mrr_at_20_diff1": 0.304402, + "nauc_mrr_at_100_max": 0.412284, + "nauc_mrr_at_100_std": 0.247635, + "nauc_mrr_at_100_diff1": 0.305191, + "nauc_mrr_at_1000_max": 0.412179, + "nauc_mrr_at_1000_std": 0.247463, + "nauc_mrr_at_1000_diff1": 0.305237, + "main_score": 0.459, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 469.9892590045929, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeFeedbackMT.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeFeedbackMT.json new file mode 100644 index 0000000000..3a88d5d687 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeFeedbackMT.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "b0f12fa0c0dd67f59c95a5c33d02aeeb4c398c5f", + "task_name": "CodeFeedbackMT", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.78, + "ndcg_at_3": 0.83827, + "ndcg_at_5": 0.84963, + "ndcg_at_10": 0.85812, + "ndcg_at_20": 0.86277, + "ndcg_at_100": 0.86825, + "ndcg_at_1000": 0.87036, + "map_at_1": 0.78, + "map_at_3": 0.8245, + "map_at_5": 0.83082, + "map_at_10": 0.83434, + "map_at_20": 0.83562, + "map_at_100": 0.83639, + "map_at_1000": 0.83647, + "recall_at_1": 0.78, + "recall_at_3": 0.87791, + "recall_at_5": 0.9054, + "recall_at_10": 0.93161, + "recall_at_20": 0.94991, + "recall_at_100": 0.97936, + "recall_at_1000": 0.99586, + "precision_at_1": 0.78, + "precision_at_3": 0.29264, + "precision_at_5": 0.18108, + "precision_at_10": 0.09316, + "precision_at_20": 0.0475, + "precision_at_100": 0.00979, + "precision_at_1000": 0.001, + "mrr_at_1": 0.779995, + "mrr_at_3": 0.824496, + "mrr_at_5": 0.830819, + "mrr_at_10": 0.834335, + "mrr_at_20": 0.835622, + "mrr_at_100": 0.836386, + "mrr_at_1000": 0.836467, + "nauc_ndcg_at_1_max": 0.418151, + "nauc_ndcg_at_1_std": -0.357471, + "nauc_ndcg_at_1_diff1": 0.853951, + "nauc_ndcg_at_3_max": 0.408541, + "nauc_ndcg_at_3_std": -0.420857, + "nauc_ndcg_at_3_diff1": 0.838604, + "nauc_ndcg_at_5_max": 0.403733, + "nauc_ndcg_at_5_std": -0.425735, + "nauc_ndcg_at_5_diff1": 0.835976, + "nauc_ndcg_at_10_max": 0.401867, + "nauc_ndcg_at_10_std": -0.416429, + "nauc_ndcg_at_10_diff1": 0.837844, + "nauc_ndcg_at_20_max": 0.4, + "nauc_ndcg_at_20_std": -0.413122, + "nauc_ndcg_at_20_diff1": 0.838731, + "nauc_ndcg_at_100_max": 0.404562, + "nauc_ndcg_at_100_std": -0.403925, + "nauc_ndcg_at_100_diff1": 0.83952, + "nauc_ndcg_at_1000_max": 0.407171, + "nauc_ndcg_at_1000_std": -0.402463, + "nauc_ndcg_at_1000_diff1": 0.84029, + "nauc_map_at_1_max": 0.418151, + "nauc_map_at_1_std": -0.357471, + "nauc_map_at_1_diff1": 0.853951, + "nauc_map_at_3_max": 0.411446, + "nauc_map_at_3_std": -0.40314, + "nauc_map_at_3_diff1": 0.842662, + "nauc_map_at_5_max": 0.408902, + "nauc_map_at_5_std": -0.405007, + "nauc_map_at_5_diff1": 0.84141, + "nauc_map_at_10_max": 0.408261, + "nauc_map_at_10_std": -0.401356, + "nauc_map_at_10_diff1": 0.842218, + "nauc_map_at_20_max": 0.407835, + "nauc_map_at_20_std": -0.400433, + "nauc_map_at_20_diff1": 0.84244, + "nauc_map_at_100_max": 0.408239, + "nauc_map_at_100_std": -0.399343, + "nauc_map_at_100_diff1": 0.842572, + "nauc_map_at_1000_max": 0.408368, + "nauc_map_at_1000_std": -0.399256, + "nauc_map_at_1000_diff1": 0.842592, + "nauc_recall_at_1_max": 0.418151, + "nauc_recall_at_1_std": -0.357471, + "nauc_recall_at_1_diff1": 0.853951, + "nauc_recall_at_3_max": 0.396961, + "nauc_recall_at_3_std": -0.490678, + "nauc_recall_at_3_diff1": 0.822754, + "nauc_recall_at_5_max": 0.378116, + "nauc_recall_at_5_std": -0.526213, + "nauc_recall_at_5_diff1": 0.809618, + "nauc_recall_at_10_max": 0.358159, + "nauc_recall_at_10_std": -0.506665, + "nauc_recall_at_10_diff1": 0.810594, + "nauc_recall_at_20_max": 0.324239, + "nauc_recall_at_20_std": -0.50663, + "nauc_recall_at_20_diff1": 0.810123, + "nauc_recall_at_100_max": 0.378219, + "nauc_recall_at_100_std": -0.342852, + "nauc_recall_at_100_diff1": 0.791616, + "nauc_recall_at_1000_max": 0.782015, + "nauc_recall_at_1000_std": 0.156545, + "nauc_recall_at_1000_diff1": 0.787718, + "nauc_precision_at_1_max": 0.418151, + "nauc_precision_at_1_std": -0.357471, + "nauc_precision_at_1_diff1": 0.853951, + "nauc_precision_at_3_max": 0.396961, + "nauc_precision_at_3_std": -0.490678, + "nauc_precision_at_3_diff1": 0.822754, + "nauc_precision_at_5_max": 0.378116, + "nauc_precision_at_5_std": -0.526213, + "nauc_precision_at_5_diff1": 0.809618, + "nauc_precision_at_10_max": 0.358159, + "nauc_precision_at_10_std": -0.506665, + "nauc_precision_at_10_diff1": 0.810594, + "nauc_precision_at_20_max": 0.324239, + "nauc_precision_at_20_std": -0.50663, + "nauc_precision_at_20_diff1": 0.810123, + "nauc_precision_at_100_max": 0.378219, + "nauc_precision_at_100_std": -0.342852, + "nauc_precision_at_100_diff1": 0.791616, + "nauc_precision_at_1000_max": 0.782015, + "nauc_precision_at_1000_std": 0.156545, + "nauc_precision_at_1000_diff1": 0.787718, + "nauc_mrr_at_1_max": 0.418151, + "nauc_mrr_at_1_std": -0.357471, + "nauc_mrr_at_1_diff1": 0.853951, + "nauc_mrr_at_3_max": 0.411446, + "nauc_mrr_at_3_std": -0.40314, + "nauc_mrr_at_3_diff1": 0.842662, + "nauc_mrr_at_5_max": 0.408902, + "nauc_mrr_at_5_std": -0.405007, + "nauc_mrr_at_5_diff1": 0.84141, + "nauc_mrr_at_10_max": 0.408261, + "nauc_mrr_at_10_std": -0.401356, + "nauc_mrr_at_10_diff1": 0.842218, + "nauc_mrr_at_20_max": 0.407835, + "nauc_mrr_at_20_std": -0.400433, + "nauc_mrr_at_20_diff1": 0.84244, + "nauc_mrr_at_100_max": 0.408239, + "nauc_mrr_at_100_std": -0.399343, + "nauc_mrr_at_100_diff1": 0.842572, + "nauc_mrr_at_1000_max": 0.408368, + "nauc_mrr_at_1000_std": -0.399256, + "nauc_mrr_at_1000_diff1": 0.842592, + "main_score": 0.85812, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 73.83928275108337, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeFeedbackST.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeFeedbackST.json new file mode 100644 index 0000000000..ceab25516c --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeFeedbackST.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "d213819e87aab9010628da8b73ab4eb337c89340", + "task_name": "CodeFeedbackST", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.72449, + "ndcg_at_3": 0.83111, + "ndcg_at_5": 0.84651, + "ndcg_at_10": 0.85462, + "ndcg_at_20": 0.85802, + "ndcg_at_100": 0.86098, + "ndcg_at_1000": 0.8616, + "map_at_1": 0.72449, + "map_at_3": 0.80609, + "map_at_5": 0.81472, + "map_at_10": 0.81815, + "map_at_20": 0.8191, + "map_at_100": 0.81953, + "map_at_1000": 0.81956, + "recall_at_1": 0.72449, + "recall_at_3": 0.90302, + "recall_at_5": 0.94008, + "recall_at_10": 0.9647, + "recall_at_20": 0.97799, + "recall_at_100": 0.99374, + "recall_at_1000": 0.99847, + "precision_at_1": 0.72449, + "precision_at_3": 0.30101, + "precision_at_5": 0.18802, + "precision_at_10": 0.09647, + "precision_at_20": 0.0489, + "precision_at_100": 0.00994, + "precision_at_1000": 0.001, + "mrr_at_1": 0.723855, + "mrr_at_3": 0.805724, + "mrr_at_5": 0.81444, + "mrr_at_10": 0.817854, + "mrr_at_20": 0.818801, + "mrr_at_100": 0.819228, + "mrr_at_1000": 0.819254, + "nauc_ndcg_at_1_max": 0.151084, + "nauc_ndcg_at_1_std": -0.420744, + "nauc_ndcg_at_1_diff1": 0.81925, + "nauc_ndcg_at_3_max": 0.176703, + "nauc_ndcg_at_3_std": -0.501911, + "nauc_ndcg_at_3_diff1": 0.773989, + "nauc_ndcg_at_5_max": 0.174469, + "nauc_ndcg_at_5_std": -0.50319, + "nauc_ndcg_at_5_diff1": 0.778962, + "nauc_ndcg_at_10_max": 0.169372, + "nauc_ndcg_at_10_std": -0.491834, + "nauc_ndcg_at_10_diff1": 0.783562, + "nauc_ndcg_at_20_max": 0.165097, + "nauc_ndcg_at_20_std": -0.484284, + "nauc_ndcg_at_20_diff1": 0.786499, + "nauc_ndcg_at_100_max": 0.166463, + "nauc_ndcg_at_100_std": -0.47717, + "nauc_ndcg_at_100_diff1": 0.788615, + "nauc_ndcg_at_1000_max": 0.167218, + "nauc_ndcg_at_1000_std": -0.475755, + "nauc_ndcg_at_1000_diff1": 0.789055, + "nauc_map_at_1_max": 0.151084, + "nauc_map_at_1_std": -0.420744, + "nauc_map_at_1_diff1": 0.81925, + "nauc_map_at_3_max": 0.169691, + "nauc_map_at_3_std": -0.4765, + "nauc_map_at_3_diff1": 0.787464, + "nauc_map_at_5_max": 0.168316, + "nauc_map_at_5_std": -0.475937, + "nauc_map_at_5_diff1": 0.790441, + "nauc_map_at_10_max": 0.166443, + "nauc_map_at_10_std": -0.471546, + "nauc_map_at_10_diff1": 0.792217, + "nauc_map_at_20_max": 0.165501, + "nauc_map_at_20_std": -0.469747, + "nauc_map_at_20_diff1": 0.792925, + "nauc_map_at_100_max": 0.165549, + "nauc_map_at_100_std": -0.468995, + "nauc_map_at_100_diff1": 0.793191, + "nauc_map_at_1000_max": 0.165596, + "nauc_map_at_1000_std": -0.468931, + "nauc_map_at_1000_diff1": 0.793202, + "nauc_recall_at_1_max": 0.151084, + "nauc_recall_at_1_std": -0.420744, + "nauc_recall_at_1_diff1": 0.81925, + "nauc_recall_at_3_max": 0.21232, + "nauc_recall_at_3_std": -0.633876, + "nauc_recall_at_3_diff1": 0.70456, + "nauc_recall_at_5_max": 0.221348, + "nauc_recall_at_5_std": -0.720958, + "nauc_recall_at_5_diff1": 0.690235, + "nauc_recall_at_10_max": 0.196356, + "nauc_recall_at_10_std": -0.742541, + "nauc_recall_at_10_diff1": 0.681404, + "nauc_recall_at_20_max": 0.113696, + "nauc_recall_at_20_std": -0.721665, + "nauc_recall_at_20_diff1": 0.686515, + "nauc_recall_at_100_max": 0.168423, + "nauc_recall_at_100_std": -0.533113, + "nauc_recall_at_100_diff1": 0.655392, + "nauc_recall_at_1000_max": 0.527359, + "nauc_recall_at_1000_std": 0.083433, + "nauc_recall_at_1000_diff1": 0.541578, + "nauc_precision_at_1_max": 0.151084, + "nauc_precision_at_1_std": -0.420744, + "nauc_precision_at_1_diff1": 0.81925, + "nauc_precision_at_3_max": 0.21232, + "nauc_precision_at_3_std": -0.633876, + "nauc_precision_at_3_diff1": 0.70456, + "nauc_precision_at_5_max": 0.221348, + "nauc_precision_at_5_std": -0.720958, + "nauc_precision_at_5_diff1": 0.690235, + "nauc_precision_at_10_max": 0.196356, + "nauc_precision_at_10_std": -0.742541, + "nauc_precision_at_10_diff1": 0.681404, + "nauc_precision_at_20_max": 0.113696, + "nauc_precision_at_20_std": -0.721665, + "nauc_precision_at_20_diff1": 0.686515, + "nauc_precision_at_100_max": 0.168423, + "nauc_precision_at_100_std": -0.533113, + "nauc_precision_at_100_diff1": 0.655392, + "nauc_precision_at_1000_max": 0.527359, + "nauc_precision_at_1000_std": 0.083433, + "nauc_precision_at_1000_diff1": 0.541578, + "nauc_mrr_at_1_max": 0.146991, + "nauc_mrr_at_1_std": -0.417748, + "nauc_mrr_at_1_diff1": 0.820673, + "nauc_mrr_at_3_max": 0.16567, + "nauc_mrr_at_3_std": -0.473801, + "nauc_mrr_at_3_diff1": 0.788171, + "nauc_mrr_at_5_max": 0.165192, + "nauc_mrr_at_5_std": -0.472967, + "nauc_mrr_at_5_diff1": 0.791216, + "nauc_mrr_at_10_max": 0.163052, + "nauc_mrr_at_10_std": -0.468827, + "nauc_mrr_at_10_diff1": 0.79305, + "nauc_mrr_at_20_max": 0.16209, + "nauc_mrr_at_20_std": -0.467034, + "nauc_mrr_at_20_diff1": 0.793749, + "nauc_mrr_at_100_max": 0.162124, + "nauc_mrr_at_100_std": -0.466281, + "nauc_mrr_at_100_diff1": 0.794017, + "nauc_mrr_at_1000_max": 0.162171, + "nauc_mrr_at_1000_std": -0.466217, + "nauc_mrr_at_1000_diff1": 0.794028, + "main_score": 0.85462, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 217.4161605834961, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeSearchNetCCRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeSearchNetCCRetrieval.json new file mode 100644 index 0000000000..f2f3cdeea8 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeSearchNetCCRetrieval.json @@ -0,0 +1,893 @@ +{ + "dataset_revision": "6e1effa2c03723c5fde48ee912b5ee08d4f211e8", + "task_name": "CodeSearchNetCCRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.89543, + "ndcg_at_3": 0.93489, + "ndcg_at_5": 0.93907, + "ndcg_at_10": 0.94176, + "ndcg_at_20": 0.94321, + "ndcg_at_100": 0.94485, + "ndcg_at_1000": 0.94544, + "map_at_1": 0.89543, + "map_at_3": 0.92578, + "map_at_5": 0.92813, + "map_at_10": 0.92924, + "map_at_20": 0.92964, + "map_at_100": 0.92987, + "map_at_1000": 0.92989, + "recall_at_1": 0.89543, + "recall_at_3": 0.96099, + "recall_at_5": 0.97104, + "recall_at_10": 0.97935, + "recall_at_20": 0.98512, + "recall_at_100": 0.9939, + "recall_at_1000": 0.99846, + "precision_at_1": 0.89543, + "precision_at_3": 0.32033, + "precision_at_5": 0.19421, + "precision_at_10": 0.09794, + "precision_at_20": 0.04926, + "precision_at_100": 0.00994, + "precision_at_1000": 0.001, + "mrr_at_1": 0.895361, + "mrr_at_3": 0.925794, + "mrr_at_5": 0.928104, + "mrr_at_10": 0.929219, + "mrr_at_20": 0.929616, + "mrr_at_100": 0.929848, + "mrr_at_1000": 0.929872, + "nauc_ndcg_at_1_max": 0.610107, + "nauc_ndcg_at_1_std": -0.207071, + "nauc_ndcg_at_1_diff1": 0.911606, + "nauc_ndcg_at_3_max": 0.703596, + "nauc_ndcg_at_3_std": -0.160654, + "nauc_ndcg_at_3_diff1": 0.913077, + "nauc_ndcg_at_5_max": 0.698971, + "nauc_ndcg_at_5_std": -0.150279, + "nauc_ndcg_at_5_diff1": 0.915211, + "nauc_ndcg_at_10_max": 0.692591, + "nauc_ndcg_at_10_std": -0.147063, + "nauc_ndcg_at_10_diff1": 0.914695, + "nauc_ndcg_at_20_max": 0.68762, + "nauc_ndcg_at_20_std": -0.146615, + "nauc_ndcg_at_20_diff1": 0.914395, + "nauc_ndcg_at_100_max": 0.681503, + "nauc_ndcg_at_100_std": -0.153231, + "nauc_ndcg_at_100_diff1": 0.914152, + "nauc_ndcg_at_1000_max": 0.678984, + "nauc_ndcg_at_1000_std": -0.15751, + "nauc_ndcg_at_1000_diff1": 0.913963, + "nauc_map_at_1_max": 0.610107, + "nauc_map_at_1_std": -0.207071, + "nauc_map_at_1_diff1": 0.911606, + "nauc_map_at_3_max": 0.675689, + "nauc_map_at_3_std": -0.176294, + "nauc_map_at_3_diff1": 0.912507, + "nauc_map_at_5_max": 0.672621, + "nauc_map_at_5_std": -0.171778, + "nauc_map_at_5_diff1": 0.91355, + "nauc_map_at_10_max": 0.670022, + "nauc_map_at_10_std": -0.170918, + "nauc_map_at_10_diff1": 0.913324, + "nauc_map_at_20_max": 0.668797, + "nauc_map_at_20_std": -0.170907, + "nauc_map_at_20_diff1": 0.913253, + "nauc_map_at_100_max": 0.668067, + "nauc_map_at_100_std": -0.171569, + "nauc_map_at_100_diff1": 0.913224, + "nauc_map_at_1000_max": 0.667983, + "nauc_map_at_1000_std": -0.17169, + "nauc_map_at_1000_diff1": 0.91322, + "nauc_recall_at_1_max": 0.610107, + "nauc_recall_at_1_std": -0.207071, + "nauc_recall_at_1_diff1": 0.911606, + "nauc_recall_at_3_max": 0.853208, + "nauc_recall_at_3_std": -0.075223, + "nauc_recall_at_3_diff1": 0.916246, + "nauc_recall_at_5_max": 0.881384, + "nauc_recall_at_5_std": 0.00578, + "nauc_recall_at_5_diff1": 0.927631, + "nauc_recall_at_10_max": 0.899594, + "nauc_recall_at_10_std": 0.094533, + "nauc_recall_at_10_diff1": 0.928584, + "nauc_recall_at_20_max": 0.904845, + "nauc_recall_at_20_std": 0.192975, + "nauc_recall_at_20_diff1": 0.929329, + "nauc_recall_at_100_max": 0.921378, + "nauc_recall_at_100_std": 0.339795, + "nauc_recall_at_100_diff1": 0.938667, + "nauc_recall_at_1000_max": 0.943673, + "nauc_recall_at_1000_std": 0.590875, + "nauc_recall_at_1000_diff1": 0.957171, + "nauc_precision_at_1_max": 0.610107, + "nauc_precision_at_1_std": -0.207071, + "nauc_precision_at_1_diff1": 0.911606, + "nauc_precision_at_3_max": 0.853208, + "nauc_precision_at_3_std": -0.075223, + "nauc_precision_at_3_diff1": 0.916246, + "nauc_precision_at_5_max": 0.881384, + "nauc_precision_at_5_std": 0.00578, + "nauc_precision_at_5_diff1": 0.927631, + "nauc_precision_at_10_max": 0.899594, + "nauc_precision_at_10_std": 0.094533, + "nauc_precision_at_10_diff1": 0.928584, + "nauc_precision_at_20_max": 0.904845, + "nauc_precision_at_20_std": 0.192975, + "nauc_precision_at_20_diff1": 0.929329, + "nauc_precision_at_100_max": 0.921378, + "nauc_precision_at_100_std": 0.339795, + "nauc_precision_at_100_diff1": 0.938667, + "nauc_precision_at_1000_max": 0.943673, + "nauc_precision_at_1000_std": 0.590875, + "nauc_precision_at_1000_diff1": 0.957171, + "nauc_mrr_at_1_max": 0.610306, + "nauc_mrr_at_1_std": -0.204897, + "nauc_mrr_at_1_diff1": 0.91174, + "nauc_mrr_at_3_max": 0.675601, + "nauc_mrr_at_3_std": -0.175001, + "nauc_mrr_at_3_diff1": 0.912632, + "nauc_mrr_at_5_max": 0.672588, + "nauc_mrr_at_5_std": -0.170874, + "nauc_mrr_at_5_diff1": 0.913654, + "nauc_mrr_at_10_max": 0.670013, + "nauc_mrr_at_10_std": -0.16954, + "nauc_mrr_at_10_diff1": 0.913425, + "nauc_mrr_at_20_max": 0.668804, + "nauc_mrr_at_20_std": -0.16955, + "nauc_mrr_at_20_diff1": 0.913352, + "nauc_mrr_at_100_max": 0.66806, + "nauc_mrr_at_100_std": -0.170176, + "nauc_mrr_at_100_diff1": 0.913326, + "nauc_mrr_at_1000_max": 0.667974, + "nauc_mrr_at_1000_std": -0.170308, + "nauc_mrr_at_1000_diff1": 0.91332, + "main_score": 0.94176, + "hf_subset": "python", + "languages": [ + "python-Code" + ] + }, + { + "ndcg_at_1": 0.89942, + "ndcg_at_3": 0.94003, + "ndcg_at_5": 0.94406, + "ndcg_at_10": 0.9457, + "ndcg_at_20": 0.94716, + "ndcg_at_100": 0.94882, + "ndcg_at_1000": 0.94934, + "map_at_1": 0.89942, + "map_at_3": 0.93067, + "map_at_5": 0.93292, + "map_at_10": 0.93357, + "map_at_20": 0.93398, + "map_at_100": 0.93424, + "map_at_1000": 0.93426, + "recall_at_1": 0.89942, + "recall_at_3": 0.96688, + "recall_at_5": 0.9766, + "recall_at_10": 0.98177, + "recall_at_20": 0.98754, + "recall_at_100": 0.99605, + "recall_at_1000": 1.0, + "precision_at_1": 0.89942, + "precision_at_3": 0.32229, + "precision_at_5": 0.19532, + "precision_at_10": 0.09818, + "precision_at_20": 0.04938, + "precision_at_100": 0.00996, + "precision_at_1000": 0.001, + "mrr_at_1": 0.898511, + "mrr_at_3": 0.930062, + "mrr_at_5": 0.932386, + "mrr_at_10": 0.933039, + "mrr_at_20": 0.933444, + "mrr_at_100": 0.933706, + "mrr_at_1000": 0.933727, + "nauc_ndcg_at_1_max": 0.588526, + "nauc_ndcg_at_1_std": -0.246338, + "nauc_ndcg_at_1_diff1": 0.897452, + "nauc_ndcg_at_3_max": 0.693094, + "nauc_ndcg_at_3_std": -0.22222, + "nauc_ndcg_at_3_diff1": 0.899362, + "nauc_ndcg_at_5_max": 0.679282, + "nauc_ndcg_at_5_std": -0.210191, + "nauc_ndcg_at_5_diff1": 0.894873, + "nauc_ndcg_at_10_max": 0.677325, + "nauc_ndcg_at_10_std": -0.210501, + "nauc_ndcg_at_10_diff1": 0.898172, + "nauc_ndcg_at_20_max": 0.674156, + "nauc_ndcg_at_20_std": -0.214564, + "nauc_ndcg_at_20_diff1": 0.898588, + "nauc_ndcg_at_100_max": 0.664618, + "nauc_ndcg_at_100_std": -0.216228, + "nauc_ndcg_at_100_diff1": 0.897315, + "nauc_ndcg_at_1000_max": 0.661802, + "nauc_ndcg_at_1000_std": -0.219294, + "nauc_ndcg_at_1000_diff1": 0.89744, + "nauc_map_at_1_max": 0.588526, + "nauc_map_at_1_std": -0.246338, + "nauc_map_at_1_diff1": 0.897452, + "nauc_map_at_3_max": 0.661935, + "nauc_map_at_3_std": -0.230564, + "nauc_map_at_3_diff1": 0.898423, + "nauc_map_at_5_max": 0.654505, + "nauc_map_at_5_std": -0.225048, + "nauc_map_at_5_diff1": 0.896338, + "nauc_map_at_10_max": 0.653524, + "nauc_map_at_10_std": -0.225013, + "nauc_map_at_10_diff1": 0.897314, + "nauc_map_at_20_max": 0.652835, + "nauc_map_at_20_std": -0.225739, + "nauc_map_at_20_diff1": 0.897471, + "nauc_map_at_100_max": 0.651567, + "nauc_map_at_100_std": -0.226055, + "nauc_map_at_100_diff1": 0.897304, + "nauc_map_at_1000_max": 0.651475, + "nauc_map_at_1000_std": -0.226066, + "nauc_map_at_1000_diff1": 0.897309, + "nauc_recall_at_1_max": 0.588526, + "nauc_recall_at_1_std": -0.246338, + "nauc_recall_at_1_diff1": 0.897452, + "nauc_recall_at_3_max": 0.876525, + "nauc_recall_at_3_std": -0.171922, + "nauc_recall_at_3_diff1": 0.905265, + "nauc_recall_at_5_max": 0.872559, + "nauc_recall_at_5_std": -0.083958, + "nauc_recall_at_5_diff1": 0.881385, + "nauc_recall_at_10_max": 0.910797, + "nauc_recall_at_10_std": -0.056518, + "nauc_recall_at_10_diff1": 0.910881, + "nauc_recall_at_20_max": 0.960035, + "nauc_recall_at_20_std": -0.063654, + "nauc_recall_at_20_diff1": 0.92098, + "nauc_recall_at_100_max": 0.945597, + "nauc_recall_at_100_std": 0.16223, + "nauc_recall_at_100_diff1": 0.885626, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": 0.588526, + "nauc_precision_at_1_std": -0.246338, + "nauc_precision_at_1_diff1": 0.897452, + "nauc_precision_at_3_max": 0.876525, + "nauc_precision_at_3_std": -0.171922, + "nauc_precision_at_3_diff1": 0.905265, + "nauc_precision_at_5_max": 0.872559, + "nauc_precision_at_5_std": -0.083958, + "nauc_precision_at_5_diff1": 0.881385, + "nauc_precision_at_10_max": 0.910797, + "nauc_precision_at_10_std": -0.056518, + "nauc_precision_at_10_diff1": 0.910881, + "nauc_precision_at_20_max": 0.960035, + "nauc_precision_at_20_std": -0.063654, + "nauc_precision_at_20_diff1": 0.92098, + "nauc_precision_at_100_max": 0.945597, + "nauc_precision_at_100_std": 0.16223, + "nauc_precision_at_100_diff1": 0.885626, + "nauc_precision_at_1000_max": NaN, + "nauc_precision_at_1000_std": NaN, + "nauc_precision_at_1000_diff1": NaN, + "nauc_mrr_at_1_max": 0.577547, + "nauc_mrr_at_1_std": -0.247307, + "nauc_mrr_at_1_diff1": 0.89943, + "nauc_mrr_at_3_max": 0.653323, + "nauc_mrr_at_3_std": -0.232934, + "nauc_mrr_at_3_diff1": 0.900074, + "nauc_mrr_at_5_max": 0.645769, + "nauc_mrr_at_5_std": -0.226502, + "nauc_mrr_at_5_diff1": 0.897946, + "nauc_mrr_at_10_max": 0.644709, + "nauc_mrr_at_10_std": -0.226481, + "nauc_mrr_at_10_diff1": 0.89893, + "nauc_mrr_at_20_max": 0.643971, + "nauc_mrr_at_20_std": -0.227211, + "nauc_mrr_at_20_diff1": 0.899096, + "nauc_mrr_at_100_max": 0.642678, + "nauc_mrr_at_100_std": -0.22753, + "nauc_mrr_at_100_diff1": 0.898937, + "nauc_mrr_at_1000_max": 0.642584, + "nauc_mrr_at_1000_std": -0.227542, + "nauc_mrr_at_1000_diff1": 0.898942, + "main_score": 0.9457, + "hf_subset": "javascript", + "languages": [ + "javascript-Code" + ] + }, + { + "ndcg_at_1": 0.9036, + "ndcg_at_3": 0.93909, + "ndcg_at_5": 0.94379, + "ndcg_at_10": 0.94688, + "ndcg_at_20": 0.94853, + "ndcg_at_100": 0.94995, + "ndcg_at_1000": 0.95021, + "map_at_1": 0.9036, + "map_at_3": 0.93083, + "map_at_5": 0.93342, + "map_at_10": 0.93471, + "map_at_20": 0.93518, + "map_at_100": 0.9354, + "map_at_1000": 0.93541, + "recall_at_1": 0.9036, + "recall_at_3": 0.96282, + "recall_at_5": 0.97427, + "recall_at_10": 0.98375, + "recall_at_20": 0.99015, + "recall_at_100": 0.99754, + "recall_at_1000": 0.99951, + "precision_at_1": 0.9036, + "precision_at_3": 0.32094, + "precision_at_5": 0.19485, + "precision_at_10": 0.09837, + "precision_at_20": 0.04951, + "precision_at_100": 0.00998, + "precision_at_1000": 0.001, + "mrr_at_1": 0.904334, + "mrr_at_3": 0.930949, + "mrr_at_5": 0.933602, + "mrr_at_10": 0.934884, + "mrr_at_20": 0.935348, + "mrr_at_100": 0.935585, + "mrr_at_1000": 0.935596, + "nauc_ndcg_at_1_max": 0.553241, + "nauc_ndcg_at_1_std": -0.435368, + "nauc_ndcg_at_1_diff1": 0.917461, + "nauc_ndcg_at_3_max": 0.609835, + "nauc_ndcg_at_3_std": -0.477706, + "nauc_ndcg_at_3_diff1": 0.920705, + "nauc_ndcg_at_5_max": 0.607661, + "nauc_ndcg_at_5_std": -0.474195, + "nauc_ndcg_at_5_diff1": 0.921142, + "nauc_ndcg_at_10_max": 0.607731, + "nauc_ndcg_at_10_std": -0.462237, + "nauc_ndcg_at_10_diff1": 0.920395, + "nauc_ndcg_at_20_max": 0.608023, + "nauc_ndcg_at_20_std": -0.451622, + "nauc_ndcg_at_20_diff1": 0.920286, + "nauc_ndcg_at_100_max": 0.599593, + "nauc_ndcg_at_100_std": -0.455073, + "nauc_ndcg_at_100_diff1": 0.92036, + "nauc_ndcg_at_1000_max": 0.598116, + "nauc_ndcg_at_1000_std": -0.456732, + "nauc_ndcg_at_1000_diff1": 0.920119, + "nauc_map_at_1_max": 0.553241, + "nauc_map_at_1_std": -0.435368, + "nauc_map_at_1_diff1": 0.917461, + "nauc_map_at_3_max": 0.593745, + "nauc_map_at_3_std": -0.466419, + "nauc_map_at_3_diff1": 0.919783, + "nauc_map_at_5_max": 0.59219, + "nauc_map_at_5_std": -0.464452, + "nauc_map_at_5_diff1": 0.919936, + "nauc_map_at_10_max": 0.591895, + "nauc_map_at_10_std": -0.46057, + "nauc_map_at_10_diff1": 0.919689, + "nauc_map_at_20_max": 0.591778, + "nauc_map_at_20_std": -0.458156, + "nauc_map_at_20_diff1": 0.919659, + "nauc_map_at_100_max": 0.590763, + "nauc_map_at_100_std": -0.458411, + "nauc_map_at_100_diff1": 0.919685, + "nauc_map_at_1000_max": 0.590714, + "nauc_map_at_1000_std": -0.458437, + "nauc_map_at_1000_diff1": 0.919677, + "nauc_recall_at_1_max": 0.553241, + "nauc_recall_at_1_std": -0.435368, + "nauc_recall_at_1_diff1": 0.917461, + "nauc_recall_at_3_max": 0.693966, + "nauc_recall_at_3_std": -0.536037, + "nauc_recall_at_3_diff1": 0.925522, + "nauc_recall_at_5_max": 0.718888, + "nauc_recall_at_5_std": -0.542112, + "nauc_recall_at_5_diff1": 0.930153, + "nauc_recall_at_10_max": 0.784731, + "nauc_recall_at_10_std": -0.454203, + "nauc_recall_at_10_diff1": 0.927286, + "nauc_recall_at_20_max": 0.908983, + "nauc_recall_at_20_std": -0.23405, + "nauc_recall_at_20_diff1": 0.929565, + "nauc_recall_at_100_max": 0.908755, + "nauc_recall_at_100_std": -0.012286, + "nauc_recall_at_100_diff1": 0.959152, + "nauc_recall_at_1000_max": 1.0, + "nauc_recall_at_1000_std": 0.274743, + "nauc_recall_at_1000_diff1": 0.930559, + "nauc_precision_at_1_max": 0.553241, + "nauc_precision_at_1_std": -0.435368, + "nauc_precision_at_1_diff1": 0.917461, + "nauc_precision_at_3_max": 0.693966, + "nauc_precision_at_3_std": -0.536037, + "nauc_precision_at_3_diff1": 0.925522, + "nauc_precision_at_5_max": 0.718888, + "nauc_precision_at_5_std": -0.542112, + "nauc_precision_at_5_diff1": 0.930153, + "nauc_precision_at_10_max": 0.784731, + "nauc_precision_at_10_std": -0.454203, + "nauc_precision_at_10_diff1": 0.927286, + "nauc_precision_at_20_max": 0.908983, + "nauc_precision_at_20_std": -0.23405, + "nauc_precision_at_20_diff1": 0.929565, + "nauc_precision_at_100_max": 0.908755, + "nauc_precision_at_100_std": -0.012286, + "nauc_precision_at_100_diff1": 0.959152, + "nauc_precision_at_1000_max": 1.0, + "nauc_precision_at_1000_std": 0.274743, + "nauc_precision_at_1000_diff1": 0.930559, + "nauc_mrr_at_1_max": 0.562297, + "nauc_mrr_at_1_std": -0.435478, + "nauc_mrr_at_1_diff1": 0.916824, + "nauc_mrr_at_3_max": 0.598381, + "nauc_mrr_at_3_std": -0.469024, + "nauc_mrr_at_3_diff1": 0.919831, + "nauc_mrr_at_5_max": 0.597188, + "nauc_mrr_at_5_std": -0.466365, + "nauc_mrr_at_5_diff1": 0.919919, + "nauc_mrr_at_10_max": 0.59704, + "nauc_mrr_at_10_std": -0.463444, + "nauc_mrr_at_10_diff1": 0.919682, + "nauc_mrr_at_20_max": 0.596742, + "nauc_mrr_at_20_std": -0.461091, + "nauc_mrr_at_20_diff1": 0.919636, + "nauc_mrr_at_100_max": 0.596128, + "nauc_mrr_at_100_std": -0.460937, + "nauc_mrr_at_100_diff1": 0.919647, + "nauc_mrr_at_1000_max": 0.59608, + "nauc_mrr_at_1000_std": -0.460963, + "nauc_mrr_at_1000_diff1": 0.919638, + "main_score": 0.94688, + "hf_subset": "go", + "languages": [ + "go-Code" + ] + }, + { + "ndcg_at_1": 0.84933, + "ndcg_at_3": 0.89689, + "ndcg_at_5": 0.90603, + "ndcg_at_10": 0.90939, + "ndcg_at_20": 0.91298, + "ndcg_at_100": 0.91583, + "ndcg_at_1000": 0.91666, + "map_at_1": 0.84933, + "map_at_3": 0.88607, + "map_at_5": 0.89114, + "map_at_10": 0.89254, + "map_at_20": 0.89352, + "map_at_100": 0.89388, + "map_at_1000": 0.89391, + "recall_at_1": 0.84933, + "recall_at_3": 0.92784, + "recall_at_5": 0.95004, + "recall_at_10": 0.96035, + "recall_at_20": 0.97462, + "recall_at_100": 0.99048, + "recall_at_1000": 0.99683, + "precision_at_1": 0.84933, + "precision_at_3": 0.30928, + "precision_at_5": 0.19001, + "precision_at_10": 0.09603, + "precision_at_20": 0.04873, + "precision_at_100": 0.0099, + "precision_at_1000": 0.001, + "mrr_at_1": 0.851705, + "mrr_at_3": 0.886862, + "mrr_at_5": 0.892096, + "mrr_at_10": 0.893492, + "mrr_at_20": 0.894472, + "mrr_at_100": 0.89483, + "mrr_at_1000": 0.894863, + "nauc_ndcg_at_1_max": 0.671423, + "nauc_ndcg_at_1_std": -0.182023, + "nauc_ndcg_at_1_diff1": 0.915352, + "nauc_ndcg_at_3_max": 0.745344, + "nauc_ndcg_at_3_std": -0.154303, + "nauc_ndcg_at_3_diff1": 0.90122, + "nauc_ndcg_at_5_max": 0.74157, + "nauc_ndcg_at_5_std": -0.134696, + "nauc_ndcg_at_5_diff1": 0.901407, + "nauc_ndcg_at_10_max": 0.741321, + "nauc_ndcg_at_10_std": -0.148523, + "nauc_ndcg_at_10_diff1": 0.906022, + "nauc_ndcg_at_20_max": 0.737577, + "nauc_ndcg_at_20_std": -0.141653, + "nauc_ndcg_at_20_diff1": 0.906997, + "nauc_ndcg_at_100_max": 0.731047, + "nauc_ndcg_at_100_std": -0.142239, + "nauc_ndcg_at_100_diff1": 0.906022, + "nauc_ndcg_at_1000_max": 0.729055, + "nauc_ndcg_at_1000_std": -0.146599, + "nauc_ndcg_at_1000_diff1": 0.906293, + "nauc_map_at_1_max": 0.671423, + "nauc_map_at_1_std": -0.182023, + "nauc_map_at_1_diff1": 0.915352, + "nauc_map_at_3_max": 0.724025, + "nauc_map_at_3_std": -0.163193, + "nauc_map_at_3_diff1": 0.904879, + "nauc_map_at_5_max": 0.721465, + "nauc_map_at_5_std": -0.153847, + "nauc_map_at_5_diff1": 0.905063, + "nauc_map_at_10_max": 0.720657, + "nauc_map_at_10_std": -0.159086, + "nauc_map_at_10_diff1": 0.906423, + "nauc_map_at_20_max": 0.719664, + "nauc_map_at_20_std": -0.158048, + "nauc_map_at_20_diff1": 0.906681, + "nauc_map_at_100_max": 0.718957, + "nauc_map_at_100_std": -0.158288, + "nauc_map_at_100_diff1": 0.906565, + "nauc_map_at_1000_max": 0.7189, + "nauc_map_at_1000_std": -0.158381, + "nauc_map_at_1000_diff1": 0.906576, + "nauc_recall_at_1_max": 0.671423, + "nauc_recall_at_1_std": -0.182023, + "nauc_recall_at_1_diff1": 0.915352, + "nauc_recall_at_3_max": 0.838448, + "nauc_recall_at_3_std": -0.114862, + "nauc_recall_at_3_diff1": 0.885528, + "nauc_recall_at_5_max": 0.86058, + "nauc_recall_at_5_std": -0.013091, + "nauc_recall_at_5_diff1": 0.880108, + "nauc_recall_at_10_max": 0.896236, + "nauc_recall_at_10_std": -0.074284, + "nauc_recall_at_10_diff1": 0.910609, + "nauc_recall_at_20_max": 0.932606, + "nauc_recall_at_20_std": 0.070542, + "nauc_recall_at_20_diff1": 0.924947, + "nauc_recall_at_100_max": 0.944178, + "nauc_recall_at_100_std": 0.417346, + "nauc_recall_at_100_diff1": 0.910141, + "nauc_recall_at_1000_max": 0.967323, + "nauc_recall_at_1000_std": 0.626022, + "nauc_recall_at_1000_diff1": 0.967323, + "nauc_precision_at_1_max": 0.671423, + "nauc_precision_at_1_std": -0.182023, + "nauc_precision_at_1_diff1": 0.915352, + "nauc_precision_at_3_max": 0.838448, + "nauc_precision_at_3_std": -0.114862, + "nauc_precision_at_3_diff1": 0.885528, + "nauc_precision_at_5_max": 0.86058, + "nauc_precision_at_5_std": -0.013091, + "nauc_precision_at_5_diff1": 0.880108, + "nauc_precision_at_10_max": 0.896236, + "nauc_precision_at_10_std": -0.074284, + "nauc_precision_at_10_diff1": 0.910609, + "nauc_precision_at_20_max": 0.932606, + "nauc_precision_at_20_std": 0.070542, + "nauc_precision_at_20_diff1": 0.924947, + "nauc_precision_at_100_max": 0.944178, + "nauc_precision_at_100_std": 0.417346, + "nauc_precision_at_100_diff1": 0.910141, + "nauc_precision_at_1000_max": 0.967323, + "nauc_precision_at_1000_std": 0.626022, + "nauc_precision_at_1000_diff1": 0.967323, + "nauc_mrr_at_1_max": 0.683799, + "nauc_mrr_at_1_std": -0.166916, + "nauc_mrr_at_1_diff1": 0.911929, + "nauc_mrr_at_3_max": 0.731895, + "nauc_mrr_at_3_std": -0.153293, + "nauc_mrr_at_3_diff1": 0.902378, + "nauc_mrr_at_5_max": 0.729692, + "nauc_mrr_at_5_std": -0.143964, + "nauc_mrr_at_5_diff1": 0.902294, + "nauc_mrr_at_10_max": 0.728989, + "nauc_mrr_at_10_std": -0.14911, + "nauc_mrr_at_10_diff1": 0.903628, + "nauc_mrr_at_20_max": 0.728068, + "nauc_mrr_at_20_std": -0.147968, + "nauc_mrr_at_20_diff1": 0.903861, + "nauc_mrr_at_100_max": 0.727385, + "nauc_mrr_at_100_std": -0.148175, + "nauc_mrr_at_100_diff1": 0.903734, + "nauc_mrr_at_1000_max": 0.727331, + "nauc_mrr_at_1000_std": -0.148265, + "nauc_mrr_at_1000_diff1": 0.903744, + "main_score": 0.90939, + "hf_subset": "ruby", + "languages": [ + "ruby-Code" + ] + }, + { + "ndcg_at_1": 0.89877, + "ndcg_at_3": 0.93265, + "ndcg_at_5": 0.93593, + "ndcg_at_10": 0.93883, + "ndcg_at_20": 0.94013, + "ndcg_at_100": 0.94172, + "ndcg_at_1000": 0.94238, + "map_at_1": 0.89877, + "map_at_3": 0.92483, + "map_at_5": 0.92665, + "map_at_10": 0.92785, + "map_at_20": 0.92821, + "map_at_100": 0.92842, + "map_at_1000": 0.92845, + "recall_at_1": 0.89877, + "recall_at_3": 0.95509, + "recall_at_5": 0.96303, + "recall_at_10": 0.97198, + "recall_at_20": 0.97709, + "recall_at_100": 0.98585, + "recall_at_1000": 0.99087, + "precision_at_1": 0.89877, + "precision_at_3": 0.31836, + "precision_at_5": 0.19261, + "precision_at_10": 0.0972, + "precision_at_20": 0.04885, + "precision_at_100": 0.00986, + "precision_at_1000": 0.00099, + "mrr_at_1": 0.898494, + "mrr_at_3": 0.924707, + "mrr_at_5": 0.926537, + "mrr_at_10": 0.927722, + "mrr_at_20": 0.928101, + "mrr_at_100": 0.928309, + "mrr_at_1000": 0.928336, + "nauc_ndcg_at_1_max": 0.66351, + "nauc_ndcg_at_1_std": -0.145829, + "nauc_ndcg_at_1_diff1": 0.92367, + "nauc_ndcg_at_3_max": 0.766042, + "nauc_ndcg_at_3_std": -0.051467, + "nauc_ndcg_at_3_diff1": 0.930654, + "nauc_ndcg_at_5_max": 0.76298, + "nauc_ndcg_at_5_std": -0.028149, + "nauc_ndcg_at_5_diff1": 0.931129, + "nauc_ndcg_at_10_max": 0.759427, + "nauc_ndcg_at_10_std": -0.012763, + "nauc_ndcg_at_10_diff1": 0.931194, + "nauc_ndcg_at_20_max": 0.757637, + "nauc_ndcg_at_20_std": -0.005659, + "nauc_ndcg_at_20_diff1": 0.931632, + "nauc_ndcg_at_100_max": 0.75252, + "nauc_ndcg_at_100_std": -0.009525, + "nauc_ndcg_at_100_diff1": 0.93133, + "nauc_ndcg_at_1000_max": 0.749884, + "nauc_ndcg_at_1000_std": -0.016915, + "nauc_ndcg_at_1000_diff1": 0.931155, + "nauc_map_at_1_max": 0.66351, + "nauc_map_at_1_std": -0.145829, + "nauc_map_at_1_diff1": 0.92367, + "nauc_map_at_3_max": 0.736494, + "nauc_map_at_3_std": -0.081878, + "nauc_map_at_3_diff1": 0.928481, + "nauc_map_at_5_max": 0.734202, + "nauc_map_at_5_std": -0.071408, + "nauc_map_at_5_diff1": 0.928655, + "nauc_map_at_10_max": 0.73255, + "nauc_map_at_10_std": -0.066432, + "nauc_map_at_10_diff1": 0.928632, + "nauc_map_at_20_max": 0.732047, + "nauc_map_at_20_std": -0.06493, + "nauc_map_at_20_diff1": 0.928714, + "nauc_map_at_100_max": 0.731433, + "nauc_map_at_100_std": -0.065488, + "nauc_map_at_100_diff1": 0.928681, + "nauc_map_at_1000_max": 0.731338, + "nauc_map_at_1000_std": -0.065759, + "nauc_map_at_1000_diff1": 0.928671, + "nauc_recall_at_1_max": 0.66351, + "nauc_recall_at_1_std": -0.145829, + "nauc_recall_at_1_diff1": 0.92367, + "nauc_recall_at_3_max": 0.906037, + "nauc_recall_at_3_std": 0.095118, + "nauc_recall_at_3_diff1": 0.941076, + "nauc_recall_at_5_max": 0.923832, + "nauc_recall_at_5_std": 0.225264, + "nauc_recall_at_5_diff1": 0.945324, + "nauc_recall_at_10_max": 0.950286, + "nauc_recall_at_10_std": 0.405632, + "nauc_recall_at_10_diff1": 0.950363, + "nauc_recall_at_20_max": 0.973357, + "nauc_recall_at_20_std": 0.568996, + "nauc_recall_at_20_diff1": 0.959284, + "nauc_recall_at_100_max": 0.991114, + "nauc_recall_at_100_std": 0.836722, + "nauc_recall_at_100_diff1": 0.968915, + "nauc_recall_at_1000_max": 0.994234, + "nauc_recall_at_1000_std": 0.942841, + "nauc_recall_at_1000_diff1": 0.982633, + "nauc_precision_at_1_max": 0.66351, + "nauc_precision_at_1_std": -0.145829, + "nauc_precision_at_1_diff1": 0.92367, + "nauc_precision_at_3_max": 0.906037, + "nauc_precision_at_3_std": 0.095118, + "nauc_precision_at_3_diff1": 0.941076, + "nauc_precision_at_5_max": 0.923832, + "nauc_precision_at_5_std": 0.225264, + "nauc_precision_at_5_diff1": 0.945324, + "nauc_precision_at_10_max": 0.950286, + "nauc_precision_at_10_std": 0.405632, + "nauc_precision_at_10_diff1": 0.950363, + "nauc_precision_at_20_max": 0.973357, + "nauc_precision_at_20_std": 0.568996, + "nauc_precision_at_20_diff1": 0.959284, + "nauc_precision_at_100_max": 0.991114, + "nauc_precision_at_100_std": 0.836722, + "nauc_precision_at_100_diff1": 0.968915, + "nauc_precision_at_1000_max": 0.994234, + "nauc_precision_at_1000_std": 0.942841, + "nauc_precision_at_1000_diff1": 0.982633, + "nauc_mrr_at_1_max": 0.663165, + "nauc_mrr_at_1_std": -0.143855, + "nauc_mrr_at_1_diff1": 0.924202, + "nauc_mrr_at_3_max": 0.734842, + "nauc_mrr_at_3_std": -0.080853, + "nauc_mrr_at_3_diff1": 0.928645, + "nauc_mrr_at_5_max": 0.732154, + "nauc_mrr_at_5_std": -0.071311, + "nauc_mrr_at_5_diff1": 0.928896, + "nauc_mrr_at_10_max": 0.730844, + "nauc_mrr_at_10_std": -0.066459, + "nauc_mrr_at_10_diff1": 0.928913, + "nauc_mrr_at_20_max": 0.730334, + "nauc_mrr_at_20_std": -0.064591, + "nauc_mrr_at_20_diff1": 0.928981, + "nauc_mrr_at_100_max": 0.729716, + "nauc_mrr_at_100_std": -0.065147, + "nauc_mrr_at_100_diff1": 0.928949, + "nauc_mrr_at_1000_max": 0.72962, + "nauc_mrr_at_1000_std": -0.065418, + "nauc_mrr_at_1000_diff1": 0.928939, + "main_score": 0.93883, + "hf_subset": "java", + "languages": [ + "java-Code" + ] + }, + { + "ndcg_at_1": 0.86235, + "ndcg_at_3": 0.9083, + "ndcg_at_5": 0.91559, + "ndcg_at_10": 0.92061, + "ndcg_at_20": 0.92298, + "ndcg_at_100": 0.92527, + "ndcg_at_1000": 0.92603, + "map_at_1": 0.86235, + "map_at_3": 0.89759, + "map_at_5": 0.90165, + "map_at_10": 0.90375, + "map_at_20": 0.90441, + "map_at_100": 0.90475, + "map_at_1000": 0.90478, + "recall_at_1": 0.86235, + "recall_at_3": 0.93906, + "recall_at_5": 0.95669, + "recall_at_10": 0.9721, + "recall_at_20": 0.98138, + "recall_at_100": 0.99336, + "recall_at_1000": 0.99922, + "precision_at_1": 0.86235, + "precision_at_3": 0.31302, + "precision_at_5": 0.19134, + "precision_at_10": 0.09721, + "precision_at_20": 0.04907, + "precision_at_100": 0.00993, + "precision_at_1000": 0.001, + "mrr_at_1": 0.861638, + "mrr_at_3": 0.89721, + "mrr_at_5": 0.901256, + "mrr_at_10": 0.903365, + "mrr_at_20": 0.904012, + "mrr_at_100": 0.904358, + "mrr_at_1000": 0.904388, + "nauc_ndcg_at_1_max": 0.607496, + "nauc_ndcg_at_1_std": -0.306174, + "nauc_ndcg_at_1_diff1": 0.907348, + "nauc_ndcg_at_3_max": 0.683668, + "nauc_ndcg_at_3_std": -0.298904, + "nauc_ndcg_at_3_diff1": 0.89286, + "nauc_ndcg_at_5_max": 0.683616, + "nauc_ndcg_at_5_std": -0.283198, + "nauc_ndcg_at_5_diff1": 0.894383, + "nauc_ndcg_at_10_max": 0.681152, + "nauc_ndcg_at_10_std": -0.273467, + "nauc_ndcg_at_10_diff1": 0.895855, + "nauc_ndcg_at_20_max": 0.675026, + "nauc_ndcg_at_20_std": -0.271579, + "nauc_ndcg_at_20_diff1": 0.896752, + "nauc_ndcg_at_100_max": 0.668196, + "nauc_ndcg_at_100_std": -0.275205, + "nauc_ndcg_at_100_diff1": 0.896985, + "nauc_ndcg_at_1000_max": 0.665915, + "nauc_ndcg_at_1000_std": -0.280743, + "nauc_ndcg_at_1000_diff1": 0.897251, + "nauc_map_at_1_max": 0.607496, + "nauc_map_at_1_std": -0.306174, + "nauc_map_at_1_diff1": 0.907348, + "nauc_map_at_3_max": 0.661468, + "nauc_map_at_3_std": -0.300623, + "nauc_map_at_3_diff1": 0.8966, + "nauc_map_at_5_max": 0.660471, + "nauc_map_at_5_std": -0.293523, + "nauc_map_at_5_diff1": 0.897504, + "nauc_map_at_10_max": 0.659156, + "nauc_map_at_10_std": -0.290358, + "nauc_map_at_10_diff1": 0.898109, + "nauc_map_at_20_max": 0.657613, + "nauc_map_at_20_std": -0.289961, + "nauc_map_at_20_diff1": 0.898326, + "nauc_map_at_100_max": 0.656778, + "nauc_map_at_100_std": -0.290319, + "nauc_map_at_100_diff1": 0.898361, + "nauc_map_at_1000_max": 0.656709, + "nauc_map_at_1000_std": -0.290475, + "nauc_map_at_1000_diff1": 0.89837, + "nauc_recall_at_1_max": 0.607496, + "nauc_recall_at_1_std": -0.306174, + "nauc_recall_at_1_diff1": 0.907348, + "nauc_recall_at_3_max": 0.787253, + "nauc_recall_at_3_std": -0.291182, + "nauc_recall_at_3_diff1": 0.875767, + "nauc_recall_at_5_max": 0.829474, + "nauc_recall_at_5_std": -0.212254, + "nauc_recall_at_5_diff1": 0.875703, + "nauc_recall_at_10_max": 0.888071, + "nauc_recall_at_10_std": -0.090741, + "nauc_recall_at_10_diff1": 0.877468, + "nauc_recall_at_20_max": 0.894358, + "nauc_recall_at_20_std": 0.026655, + "nauc_recall_at_20_diff1": 0.882555, + "nauc_recall_at_100_max": 0.892113, + "nauc_recall_at_100_std": 0.330185, + "nauc_recall_at_100_diff1": 0.869835, + "nauc_recall_at_1000_max": 0.904507, + "nauc_recall_at_1000_std": 0.772941, + "nauc_recall_at_1000_diff1": 0.849972, + "nauc_precision_at_1_max": 0.607496, + "nauc_precision_at_1_std": -0.306174, + "nauc_precision_at_1_diff1": 0.907348, + "nauc_precision_at_3_max": 0.787253, + "nauc_precision_at_3_std": -0.291182, + "nauc_precision_at_3_diff1": 0.875767, + "nauc_precision_at_5_max": 0.829474, + "nauc_precision_at_5_std": -0.212254, + "nauc_precision_at_5_diff1": 0.875703, + "nauc_precision_at_10_max": 0.888071, + "nauc_precision_at_10_std": -0.090741, + "nauc_precision_at_10_diff1": 0.877468, + "nauc_precision_at_20_max": 0.894358, + "nauc_precision_at_20_std": 0.026655, + "nauc_precision_at_20_diff1": 0.882555, + "nauc_precision_at_100_max": 0.892113, + "nauc_precision_at_100_std": 0.330185, + "nauc_precision_at_100_diff1": 0.869835, + "nauc_precision_at_1000_max": 0.904507, + "nauc_precision_at_1000_std": 0.772941, + "nauc_precision_at_1000_diff1": 0.849972, + "nauc_mrr_at_1_max": 0.605693, + "nauc_mrr_at_1_std": -0.31083, + "nauc_mrr_at_1_diff1": 0.908478, + "nauc_mrr_at_3_max": 0.659467, + "nauc_mrr_at_3_std": -0.303792, + "nauc_mrr_at_3_diff1": 0.897312, + "nauc_mrr_at_5_max": 0.658966, + "nauc_mrr_at_5_std": -0.296724, + "nauc_mrr_at_5_diff1": 0.898412, + "nauc_mrr_at_10_max": 0.657607, + "nauc_mrr_at_10_std": -0.293575, + "nauc_mrr_at_10_diff1": 0.8989, + "nauc_mrr_at_20_max": 0.656078, + "nauc_mrr_at_20_std": -0.293196, + "nauc_mrr_at_20_diff1": 0.899102, + "nauc_mrr_at_100_max": 0.655219, + "nauc_mrr_at_100_std": -0.29367, + "nauc_mrr_at_100_diff1": 0.89914, + "nauc_mrr_at_1000_max": 0.655151, + "nauc_mrr_at_1000_std": -0.293827, + "nauc_mrr_at_1000_diff1": 0.89915, + "main_score": 0.92061, + "hf_subset": "php", + "languages": [ + "php-Code" + ] + } + ] + }, + "evaluation_time": 442.222136259079, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeTransOceanContest.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeTransOceanContest.json new file mode 100644 index 0000000000..4b278b4674 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeTransOceanContest.json @@ -0,0 +1,159 @@ +{ + "dataset_revision": "20da4eb20a4b17300c0986ee148c90867a7f2a4d", + "task_name": "CodeTransOceanContest", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.62443, + "ndcg_at_3": 0.70523, + "ndcg_at_5": 0.71828, + "ndcg_at_10": 0.73023, + "ndcg_at_20": 0.74269, + "ndcg_at_100": 0.75512, + "ndcg_at_1000": 0.76154, + "map_at_1": 0.62443, + "map_at_3": 0.68477, + "map_at_5": 0.69201, + "map_at_10": 0.69708, + "map_at_20": 0.70043, + "map_at_100": 0.70207, + "map_at_1000": 0.70231, + "recall_at_1": 0.62443, + "recall_at_3": 0.76471, + "recall_at_5": 0.79638, + "recall_at_10": 0.83258, + "recall_at_20": 0.88235, + "recall_at_100": 0.95023, + "recall_at_1000": 1.0, + "precision_at_1": 0.62443, + "precision_at_3": 0.2549, + "precision_at_5": 0.15928, + "precision_at_10": 0.08326, + "precision_at_20": 0.04412, + "precision_at_100": 0.0095, + "precision_at_1000": 0.001, + "mrr_at_1": 0.624434, + "mrr_at_3": 0.684766, + "mrr_at_5": 0.692006, + "mrr_at_10": 0.697082, + "mrr_at_20": 0.700434, + "mrr_at_100": 0.702067, + "mrr_at_1000": 0.702313, + "nauc_ndcg_at_1_max": 0.636437, + "nauc_ndcg_at_1_std": -0.205381, + "nauc_ndcg_at_1_diff1": 0.816147, + "nauc_ndcg_at_3_max": 0.620599, + "nauc_ndcg_at_3_std": -0.245431, + "nauc_ndcg_at_3_diff1": 0.766039, + "nauc_ndcg_at_5_max": 0.623674, + "nauc_ndcg_at_5_std": -0.211724, + "nauc_ndcg_at_5_diff1": 0.759409, + "nauc_ndcg_at_10_max": 0.623656, + "nauc_ndcg_at_10_std": -0.216514, + "nauc_ndcg_at_10_diff1": 0.757428, + "nauc_ndcg_at_20_max": 0.628353, + "nauc_ndcg_at_20_std": -0.208346, + "nauc_ndcg_at_20_diff1": 0.752952, + "nauc_ndcg_at_100_max": 0.618402, + "nauc_ndcg_at_100_std": -0.21579, + "nauc_ndcg_at_100_diff1": 0.757505, + "nauc_ndcg_at_1000_max": 0.6249, + "nauc_ndcg_at_1000_std": -0.215519, + "nauc_ndcg_at_1000_diff1": 0.764662, + "nauc_map_at_1_max": 0.636437, + "nauc_map_at_1_std": -0.205381, + "nauc_map_at_1_diff1": 0.816147, + "nauc_map_at_3_max": 0.625265, + "nauc_map_at_3_std": -0.23754, + "nauc_map_at_3_diff1": 0.779428, + "nauc_map_at_5_max": 0.626306, + "nauc_map_at_5_std": -0.219713, + "nauc_map_at_5_diff1": 0.775841, + "nauc_map_at_10_max": 0.626475, + "nauc_map_at_10_std": -0.221416, + "nauc_map_at_10_diff1": 0.775233, + "nauc_map_at_20_max": 0.627781, + "nauc_map_at_20_std": -0.218868, + "nauc_map_at_20_diff1": 0.774179, + "nauc_map_at_100_max": 0.626586, + "nauc_map_at_100_std": -0.22013, + "nauc_map_at_100_diff1": 0.774734, + "nauc_map_at_1000_max": 0.626886, + "nauc_map_at_1000_std": -0.219846, + "nauc_map_at_1000_diff1": 0.774972, + "nauc_recall_at_1_max": 0.636437, + "nauc_recall_at_1_std": -0.205381, + "nauc_recall_at_1_diff1": 0.816147, + "nauc_recall_at_3_max": 0.603724, + "nauc_recall_at_3_std": -0.272103, + "nauc_recall_at_3_diff1": 0.718264, + "nauc_recall_at_5_max": 0.614835, + "nauc_recall_at_5_std": -0.17238, + "nauc_recall_at_5_diff1": 0.694407, + "nauc_recall_at_10_max": 0.61189, + "nauc_recall_at_10_std": -0.188246, + "nauc_recall_at_10_diff1": 0.674057, + "nauc_recall_at_20_max": 0.640424, + "nauc_recall_at_20_std": -0.126591, + "nauc_recall_at_20_diff1": 0.611969, + "nauc_recall_at_100_max": 0.437815, + "nauc_recall_at_100_std": -0.159148, + "nauc_recall_at_100_diff1": 0.533739, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": 0.636437, + "nauc_precision_at_1_std": -0.205381, + "nauc_precision_at_1_diff1": 0.816147, + "nauc_precision_at_3_max": 0.603724, + "nauc_precision_at_3_std": -0.272103, + "nauc_precision_at_3_diff1": 0.718264, + "nauc_precision_at_5_max": 0.614835, + "nauc_precision_at_5_std": -0.17238, + "nauc_precision_at_5_diff1": 0.694407, + "nauc_precision_at_10_max": 0.61189, + "nauc_precision_at_10_std": -0.188246, + "nauc_precision_at_10_diff1": 0.674057, + "nauc_precision_at_20_max": 0.640424, + "nauc_precision_at_20_std": -0.126591, + "nauc_precision_at_20_diff1": 0.611969, + "nauc_precision_at_100_max": 0.437815, + "nauc_precision_at_100_std": -0.159148, + "nauc_precision_at_100_diff1": 0.533739, + "nauc_precision_at_1000_max": 1.0, + "nauc_precision_at_1000_std": 1.0, + "nauc_precision_at_1000_diff1": 1.0, + "nauc_mrr_at_1_max": 0.636437, + "nauc_mrr_at_1_std": -0.205381, + "nauc_mrr_at_1_diff1": 0.816147, + "nauc_mrr_at_3_max": 0.625265, + "nauc_mrr_at_3_std": -0.23754, + "nauc_mrr_at_3_diff1": 0.779428, + "nauc_mrr_at_5_max": 0.626306, + "nauc_mrr_at_5_std": -0.219713, + "nauc_mrr_at_5_diff1": 0.775841, + "nauc_mrr_at_10_max": 0.626475, + "nauc_mrr_at_10_std": -0.221416, + "nauc_mrr_at_10_diff1": 0.775233, + "nauc_mrr_at_20_max": 0.627781, + "nauc_mrr_at_20_std": -0.218868, + "nauc_mrr_at_20_diff1": 0.774179, + "nauc_mrr_at_100_max": 0.626586, + "nauc_mrr_at_100_std": -0.22013, + "nauc_mrr_at_100_diff1": 0.774734, + "nauc_mrr_at_1000_max": 0.626886, + "nauc_mrr_at_1000_std": -0.219846, + "nauc_mrr_at_1000_diff1": 0.774972, + "main_score": 0.73023, + "hf_subset": "default", + "languages": [ + "python-Code", + "c++-Code" + ] + } + ] + }, + "evaluation_time": 1.4903316497802734, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeTransOceanDL.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeTransOceanDL.json new file mode 100644 index 0000000000..a0331ed5d1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CodeTransOceanDL.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "281562cb8a1265ab5c0824bfa6ddcd9b0a15618f", + "task_name": "CodeTransOceanDL", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.08333, + "ndcg_at_3": 0.14616, + "ndcg_at_5": 0.21526, + "ndcg_at_10": 0.36099, + "ndcg_at_20": 0.40835, + "ndcg_at_100": 0.41079, + "ndcg_at_1000": 0.41079, + "map_at_1": 0.08333, + "map_at_3": 0.12963, + "map_at_5": 0.16824, + "map_at_10": 0.22743, + "map_at_20": 0.24249, + "map_at_100": 0.24299, + "map_at_1000": 0.24299, + "recall_at_1": 0.08333, + "recall_at_3": 0.19444, + "recall_at_5": 0.36111, + "recall_at_10": 0.81667, + "recall_at_20": 0.98889, + "recall_at_100": 1.0, + "recall_at_1000": 1.0, + "precision_at_1": 0.08333, + "precision_at_3": 0.06481, + "precision_at_5": 0.07222, + "precision_at_10": 0.08167, + "precision_at_20": 0.04944, + "precision_at_100": 0.01, + "precision_at_1000": 0.001, + "mrr_at_1": 0.077778, + "mrr_at_3": 0.127778, + "mrr_at_5": 0.160556, + "mrr_at_10": 0.224795, + "mrr_at_20": 0.238162, + "mrr_at_100": 0.238393, + "mrr_at_1000": 0.238393, + "nauc_ndcg_at_1_max": -0.385404, + "nauc_ndcg_at_1_std": -0.247867, + "nauc_ndcg_at_1_diff1": 0.002737, + "nauc_ndcg_at_3_max": -0.432872, + "nauc_ndcg_at_3_std": -0.224822, + "nauc_ndcg_at_3_diff1": 0.119364, + "nauc_ndcg_at_5_max": -0.367775, + "nauc_ndcg_at_5_std": -0.164777, + "nauc_ndcg_at_5_diff1": 0.115921, + "nauc_ndcg_at_10_max": -0.347495, + "nauc_ndcg_at_10_std": -0.235082, + "nauc_ndcg_at_10_diff1": 0.08545, + "nauc_ndcg_at_20_max": -0.367922, + "nauc_ndcg_at_20_std": -0.187981, + "nauc_ndcg_at_20_diff1": 0.099941, + "nauc_ndcg_at_100_max": -0.371084, + "nauc_ndcg_at_100_std": -0.199916, + "nauc_ndcg_at_100_diff1": 0.087746, + "nauc_ndcg_at_1000_max": -0.371084, + "nauc_ndcg_at_1000_std": -0.199916, + "nauc_ndcg_at_1000_diff1": 0.087746, + "nauc_map_at_1_max": -0.385404, + "nauc_map_at_1_std": -0.247867, + "nauc_map_at_1_diff1": 0.002737, + "nauc_map_at_3_max": -0.423341, + "nauc_map_at_3_std": -0.229222, + "nauc_map_at_3_diff1": 0.097135, + "nauc_map_at_5_max": -0.377152, + "nauc_map_at_5_std": -0.188776, + "nauc_map_at_5_diff1": 0.096172, + "nauc_map_at_10_max": -0.367331, + "nauc_map_at_10_std": -0.216985, + "nauc_map_at_10_diff1": 0.080193, + "nauc_map_at_20_max": -0.374702, + "nauc_map_at_20_std": -0.203118, + "nauc_map_at_20_diff1": 0.084017, + "nauc_map_at_100_max": -0.375246, + "nauc_map_at_100_std": -0.205146, + "nauc_map_at_100_diff1": 0.081962, + "nauc_map_at_1000_max": -0.375246, + "nauc_map_at_1000_std": -0.205146, + "nauc_map_at_1000_diff1": 0.081962, + "nauc_recall_at_1_max": -0.385404, + "nauc_recall_at_1_std": -0.247867, + "nauc_recall_at_1_diff1": 0.002737, + "nauc_recall_at_3_max": -0.453043, + "nauc_recall_at_3_std": -0.215565, + "nauc_recall_at_3_diff1": 0.166109, + "nauc_recall_at_5_max": -0.349583, + "nauc_recall_at_5_std": -0.117584, + "nauc_recall_at_5_diff1": 0.151929, + "nauc_recall_at_10_max": -0.27302, + "nauc_recall_at_10_std": -0.337124, + "nauc_recall_at_10_diff1": 0.091072, + "nauc_recall_at_20_max": -0.171335, + "nauc_recall_at_20_std": 0.554155, + "nauc_recall_at_20_diff1": 0.861111, + "nauc_recall_at_100_max": NaN, + "nauc_recall_at_100_std": NaN, + "nauc_recall_at_100_diff1": NaN, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": -0.385404, + "nauc_precision_at_1_std": -0.247867, + "nauc_precision_at_1_diff1": 0.002737, + "nauc_precision_at_3_max": -0.453043, + "nauc_precision_at_3_std": -0.215565, + "nauc_precision_at_3_diff1": 0.166109, + "nauc_precision_at_5_max": -0.349583, + "nauc_precision_at_5_std": -0.117584, + "nauc_precision_at_5_diff1": 0.151929, + "nauc_precision_at_10_max": -0.27302, + "nauc_precision_at_10_std": -0.337124, + "nauc_precision_at_10_diff1": 0.091072, + "nauc_precision_at_20_max": -0.171335, + "nauc_precision_at_20_std": 0.554155, + "nauc_precision_at_20_diff1": 0.861111, + "nauc_precision_at_100_max": 1.0, + "nauc_precision_at_100_std": 1.0, + "nauc_precision_at_100_diff1": 1.0, + "nauc_precision_at_1000_max": 1.0, + "nauc_precision_at_1000_std": 1.0, + "nauc_precision_at_1000_diff1": 1.0, + "nauc_mrr_at_1_max": -0.377247, + "nauc_mrr_at_1_std": -0.229886, + "nauc_mrr_at_1_diff1": 0.032581, + "nauc_mrr_at_3_max": -0.381943, + "nauc_mrr_at_3_std": -0.201363, + "nauc_mrr_at_3_diff1": 0.076468, + "nauc_mrr_at_5_max": -0.349148, + "nauc_mrr_at_5_std": -0.173706, + "nauc_mrr_at_5_diff1": 0.120541, + "nauc_mrr_at_10_max": -0.349108, + "nauc_mrr_at_10_std": -0.188868, + "nauc_mrr_at_10_diff1": 0.106873, + "nauc_mrr_at_20_max": -0.347074, + "nauc_mrr_at_20_std": -0.182817, + "nauc_mrr_at_20_diff1": 0.098891, + "nauc_mrr_at_100_max": -0.347301, + "nauc_mrr_at_100_std": -0.18377, + "nauc_mrr_at_100_diff1": 0.097725, + "nauc_mrr_at_1000_max": -0.347301, + "nauc_mrr_at_1000_std": -0.18377, + "nauc_mrr_at_1000_diff1": 0.097725, + "main_score": 0.36099, + "hf_subset": "default", + "languages": [ + "python-Code" + ] + } + ] + }, + "evaluation_time": 1.404336929321289, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CosQA.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CosQA.json new file mode 100644 index 0000000000..1496c4eb94 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/CosQA.json @@ -0,0 +1,159 @@ +{ + "dataset_revision": "bc5efb7e9d437246ce393ed19d772e08e4a79535", + "task_name": "CosQA", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.204, + "ndcg_at_3": 0.30357, + "ndcg_at_5": 0.36623, + "ndcg_at_10": 0.42175, + "ndcg_at_20": 0.4499, + "ndcg_at_100": 0.47951, + "ndcg_at_1000": 0.48391, + "map_at_1": 0.204, + "map_at_3": 0.278, + "map_at_5": 0.3128, + "map_at_10": 0.33603, + "map_at_20": 0.34393, + "map_at_100": 0.34827, + "map_at_1000": 0.34844, + "recall_at_1": 0.204, + "recall_at_3": 0.378, + "recall_at_5": 0.53, + "recall_at_10": 0.7, + "recall_at_20": 0.81, + "recall_at_100": 0.966, + "recall_at_1000": 1.0, + "precision_at_1": 0.204, + "precision_at_3": 0.126, + "precision_at_5": 0.106, + "precision_at_10": 0.07, + "precision_at_20": 0.0405, + "precision_at_100": 0.00966, + "precision_at_1000": 0.001, + "mrr_at_1": 0.196, + "mrr_at_3": 0.261667, + "mrr_at_5": 0.291667, + "mrr_at_10": 0.317115, + "mrr_at_20": 0.326484, + "mrr_at_100": 0.330951, + "mrr_at_1000": 0.331125, + "nauc_ndcg_at_1_max": 0.050728, + "nauc_ndcg_at_1_std": -0.069837, + "nauc_ndcg_at_1_diff1": 0.322639, + "nauc_ndcg_at_3_max": 0.078884, + "nauc_ndcg_at_3_std": -0.080157, + "nauc_ndcg_at_3_diff1": 0.205242, + "nauc_ndcg_at_5_max": 0.106716, + "nauc_ndcg_at_5_std": -0.063355, + "nauc_ndcg_at_5_diff1": 0.181632, + "nauc_ndcg_at_10_max": 0.102381, + "nauc_ndcg_at_10_std": -0.084128, + "nauc_ndcg_at_10_diff1": 0.162447, + "nauc_ndcg_at_20_max": 0.117062, + "nauc_ndcg_at_20_std": -0.067782, + "nauc_ndcg_at_20_diff1": 0.172394, + "nauc_ndcg_at_100_max": 0.106957, + "nauc_ndcg_at_100_std": -0.061733, + "nauc_ndcg_at_100_diff1": 0.188506, + "nauc_ndcg_at_1000_max": 0.100223, + "nauc_ndcg_at_1000_std": -0.06977, + "nauc_ndcg_at_1000_diff1": 0.198541, + "nauc_map_at_1_max": 0.050728, + "nauc_map_at_1_std": -0.069837, + "nauc_map_at_1_diff1": 0.322639, + "nauc_map_at_3_max": 0.07279, + "nauc_map_at_3_std": -0.079651, + "nauc_map_at_3_diff1": 0.231934, + "nauc_map_at_5_max": 0.088576, + "nauc_map_at_5_std": -0.069613, + "nauc_map_at_5_diff1": 0.219877, + "nauc_map_at_10_max": 0.087203, + "nauc_map_at_10_std": -0.078027, + "nauc_map_at_10_diff1": 0.213149, + "nauc_map_at_20_max": 0.090772, + "nauc_map_at_20_std": -0.073855, + "nauc_map_at_20_diff1": 0.216904, + "nauc_map_at_100_max": 0.089428, + "nauc_map_at_100_std": -0.073159, + "nauc_map_at_100_diff1": 0.219165, + "nauc_map_at_1000_max": 0.089179, + "nauc_map_at_1000_std": -0.073391, + "nauc_map_at_1000_diff1": 0.219558, + "nauc_recall_at_1_max": 0.050728, + "nauc_recall_at_1_std": -0.069837, + "nauc_recall_at_1_diff1": 0.322639, + "nauc_recall_at_3_max": 0.094697, + "nauc_recall_at_3_std": -0.080825, + "nauc_recall_at_3_diff1": 0.135507, + "nauc_recall_at_5_max": 0.159626, + "nauc_recall_at_5_std": -0.043973, + "nauc_recall_at_5_diff1": 0.073112, + "nauc_recall_at_10_max": 0.154527, + "nauc_recall_at_10_std": -0.112527, + "nauc_recall_at_10_diff1": -0.026341, + "nauc_recall_at_20_max": 0.267002, + "nauc_recall_at_20_std": -0.023584, + "nauc_recall_at_20_diff1": -0.054262, + "nauc_recall_at_100_max": 0.478168, + "nauc_recall_at_100_std": 0.406272, + "nauc_recall_at_100_diff1": -0.351788, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": 0.050728, + "nauc_precision_at_1_std": -0.069837, + "nauc_precision_at_1_diff1": 0.322639, + "nauc_precision_at_3_max": 0.094697, + "nauc_precision_at_3_std": -0.080825, + "nauc_precision_at_3_diff1": 0.135507, + "nauc_precision_at_5_max": 0.159626, + "nauc_precision_at_5_std": -0.043973, + "nauc_precision_at_5_diff1": 0.073112, + "nauc_precision_at_10_max": 0.154527, + "nauc_precision_at_10_std": -0.112527, + "nauc_precision_at_10_diff1": -0.026341, + "nauc_precision_at_20_max": 0.267002, + "nauc_precision_at_20_std": -0.023584, + "nauc_precision_at_20_diff1": -0.054262, + "nauc_precision_at_100_max": 0.478168, + "nauc_precision_at_100_std": 0.406272, + "nauc_precision_at_100_diff1": -0.351788, + "nauc_precision_at_1000_max": 1.0, + "nauc_precision_at_1000_std": 1.0, + "nauc_precision_at_1000_diff1": 1.0, + "nauc_mrr_at_1_max": 0.009023, + "nauc_mrr_at_1_std": -0.18106, + "nauc_mrr_at_1_diff1": 0.34852, + "nauc_mrr_at_3_max": 0.025663, + "nauc_mrr_at_3_std": -0.160123, + "nauc_mrr_at_3_diff1": 0.269201, + "nauc_mrr_at_5_max": 0.033745, + "nauc_mrr_at_5_std": -0.15786, + "nauc_mrr_at_5_diff1": 0.259661, + "nauc_mrr_at_10_max": 0.034283, + "nauc_mrr_at_10_std": -0.162426, + "nauc_mrr_at_10_diff1": 0.241737, + "nauc_mrr_at_20_max": 0.038542, + "nauc_mrr_at_20_std": -0.159906, + "nauc_mrr_at_20_diff1": 0.246013, + "nauc_mrr_at_100_max": 0.038587, + "nauc_mrr_at_100_std": -0.158926, + "nauc_mrr_at_100_diff1": 0.248046, + "nauc_mrr_at_1000_max": 0.038305, + "nauc_mrr_at_1000_std": -0.159211, + "nauc_mrr_at_1000_diff1": 0.248462, + "main_score": 0.42175, + "hf_subset": "default", + "languages": [ + "eng-Latn", + "python-Code" + ] + } + ] + }, + "evaluation_time": 3.2009878158569336, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/DBPedia.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/DBPedia.json new file mode 100644 index 0000000000..c35592650b --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/DBPedia.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "c0f706b76e590d620bd6618b3ca8efdd34e2d659", + "task_name": "DBPedia", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.55375, + "ndcg_at_3": 0.45367, + "ndcg_at_5": 0.42663, + "ndcg_at_10": 0.41388, + "ndcg_at_20": 0.40781, + "ndcg_at_100": 0.45968, + "ndcg_at_1000": 0.53013, + "map_at_1": 0.09499, + "map_at_3": 0.14105, + "map_at_5": 0.16163, + "map_at_10": 0.19547, + "map_at_20": 0.22422, + "map_at_100": 0.27104, + "map_at_1000": 0.28721, + "recall_at_1": 0.09499, + "recall_at_3": 0.15388, + "recall_at_5": 0.18644, + "recall_at_10": 0.25366, + "recall_at_20": 0.325, + "recall_at_100": 0.5151, + "recall_at_1000": 0.73716, + "precision_at_1": 0.6725, + "precision_at_3": 0.47083, + "precision_at_5": 0.3975, + "precision_at_10": 0.32075, + "precision_at_20": 0.24062, + "precision_at_100": 0.10398, + "precision_at_1000": 0.02109, + "mrr_at_1": 0.6725, + "mrr_at_3": 0.7375, + "mrr_at_5": 0.748875, + "mrr_at_10": 0.754502, + "mrr_at_20": 0.757139, + "mrr_at_100": 0.757974, + "mrr_at_1000": 0.758072, + "nauc_ndcg_at_1_max": 0.426545, + "nauc_ndcg_at_1_std": 0.261861, + "nauc_ndcg_at_1_diff1": 0.499532, + "nauc_ndcg_at_3_max": 0.345207, + "nauc_ndcg_at_3_std": 0.27884, + "nauc_ndcg_at_3_diff1": 0.35129, + "nauc_ndcg_at_5_max": 0.345528, + "nauc_ndcg_at_5_std": 0.287234, + "nauc_ndcg_at_5_diff1": 0.336494, + "nauc_ndcg_at_10_max": 0.351302, + "nauc_ndcg_at_10_std": 0.301841, + "nauc_ndcg_at_10_diff1": 0.344625, + "nauc_ndcg_at_20_max": 0.352172, + "nauc_ndcg_at_20_std": 0.279865, + "nauc_ndcg_at_20_diff1": 0.358719, + "nauc_ndcg_at_100_max": 0.369835, + "nauc_ndcg_at_100_std": 0.327226, + "nauc_ndcg_at_100_diff1": 0.339169, + "nauc_ndcg_at_1000_max": 0.39362, + "nauc_ndcg_at_1000_std": 0.405204, + "nauc_ndcg_at_1000_diff1": 0.344677, + "nauc_map_at_1_max": 0.06067, + "nauc_map_at_1_std": -0.124755, + "nauc_map_at_1_diff1": 0.400801, + "nauc_map_at_3_max": 0.076959, + "nauc_map_at_3_std": -0.071405, + "nauc_map_at_3_diff1": 0.312565, + "nauc_map_at_5_max": 0.111585, + "nauc_map_at_5_std": -0.03276, + "nauc_map_at_5_diff1": 0.313251, + "nauc_map_at_10_max": 0.160756, + "nauc_map_at_10_std": 0.030405, + "nauc_map_at_10_diff1": 0.298738, + "nauc_map_at_20_max": 0.209185, + "nauc_map_at_20_std": 0.1021, + "nauc_map_at_20_diff1": 0.297573, + "nauc_map_at_100_max": 0.25491, + "nauc_map_at_100_std": 0.219107, + "nauc_map_at_100_diff1": 0.270017, + "nauc_map_at_1000_max": 0.259302, + "nauc_map_at_1000_std": 0.253499, + "nauc_map_at_1000_diff1": 0.263966, + "nauc_recall_at_1_max": 0.06067, + "nauc_recall_at_1_std": -0.124755, + "nauc_recall_at_1_diff1": 0.400801, + "nauc_recall_at_3_max": 0.042574, + "nauc_recall_at_3_std": -0.089709, + "nauc_recall_at_3_diff1": 0.258459, + "nauc_recall_at_5_max": 0.083433, + "nauc_recall_at_5_std": -0.051731, + "nauc_recall_at_5_diff1": 0.263208, + "nauc_recall_at_10_max": 0.140344, + "nauc_recall_at_10_std": 0.00534, + "nauc_recall_at_10_diff1": 0.238273, + "nauc_recall_at_20_max": 0.203901, + "nauc_recall_at_20_std": 0.074582, + "nauc_recall_at_20_diff1": 0.247213, + "nauc_recall_at_100_max": 0.277437, + "nauc_recall_at_100_std": 0.272708, + "nauc_recall_at_100_diff1": 0.201935, + "nauc_recall_at_1000_max": 0.336366, + "nauc_recall_at_1000_std": 0.437369, + "nauc_recall_at_1000_diff1": 0.213234, + "nauc_precision_at_1_max": 0.486399, + "nauc_precision_at_1_std": 0.315921, + "nauc_precision_at_1_diff1": 0.526191, + "nauc_precision_at_3_max": 0.307748, + "nauc_precision_at_3_std": 0.358095, + "nauc_precision_at_3_diff1": 0.135111, + "nauc_precision_at_5_max": 0.32002, + "nauc_precision_at_5_std": 0.40832, + "nauc_precision_at_5_diff1": 0.080034, + "nauc_precision_at_10_max": 0.302004, + "nauc_precision_at_10_std": 0.453337, + "nauc_precision_at_10_diff1": 0.021409, + "nauc_precision_at_20_max": 0.296512, + "nauc_precision_at_20_std": 0.474241, + "nauc_precision_at_20_diff1": 0.009284, + "nauc_precision_at_100_max": 0.169896, + "nauc_precision_at_100_std": 0.428678, + "nauc_precision_at_100_diff1": -0.066789, + "nauc_precision_at_1000_max": -0.023649, + "nauc_precision_at_1000_std": 0.215565, + "nauc_precision_at_1000_diff1": -0.163932, + "nauc_mrr_at_1_max": 0.486399, + "nauc_mrr_at_1_std": 0.315921, + "nauc_mrr_at_1_diff1": 0.526191, + "nauc_mrr_at_3_max": 0.481402, + "nauc_mrr_at_3_std": 0.329776, + "nauc_mrr_at_3_diff1": 0.50619, + "nauc_mrr_at_5_max": 0.487003, + "nauc_mrr_at_5_std": 0.337776, + "nauc_mrr_at_5_diff1": 0.501305, + "nauc_mrr_at_10_max": 0.48624, + "nauc_mrr_at_10_std": 0.33774, + "nauc_mrr_at_10_diff1": 0.498495, + "nauc_mrr_at_20_max": 0.490613, + "nauc_mrr_at_20_std": 0.34082, + "nauc_mrr_at_20_diff1": 0.503306, + "nauc_mrr_at_100_max": 0.489821, + "nauc_mrr_at_100_std": 0.33963, + "nauc_mrr_at_100_diff1": 0.503003, + "nauc_mrr_at_1000_max": 0.489699, + "nauc_mrr_at_1000_std": 0.339473, + "nauc_mrr_at_1000_diff1": 0.503152, + "main_score": 0.41388, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 247.7287290096283, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/EmotionClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/EmotionClassification.json new file mode 100644 index 0000000000..aed67cc7bf --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/EmotionClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "4f58c6b202a23cf9a4da393831edf4f9183cad37", + "task_name": "EmotionClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.5039, + "f1": 0.452184, + "f1_weighted": 0.525821, + "scores_per_experiment": [ + { + "accuracy": 0.502, + "f1": 0.447035, + "f1_weighted": 0.524061 + }, + { + "accuracy": 0.4785, + "f1": 0.432188, + "f1_weighted": 0.499745 + }, + { + "accuracy": 0.4995, + "f1": 0.446911, + "f1_weighted": 0.521497 + }, + { + "accuracy": 0.495, + "f1": 0.44964, + "f1_weighted": 0.5218 + }, + { + "accuracy": 0.5215, + "f1": 0.468883, + "f1_weighted": 0.543659 + }, + { + "accuracy": 0.52, + "f1": 0.451911, + "f1_weighted": 0.5399 + }, + { + "accuracy": 0.507, + "f1": 0.453322, + "f1_weighted": 0.529803 + }, + { + "accuracy": 0.4945, + "f1": 0.45046, + "f1_weighted": 0.511576 + }, + { + "accuracy": 0.521, + "f1": 0.467047, + "f1_weighted": 0.543983 + }, + { + "accuracy": 0.5, + "f1": 0.454439, + "f1_weighted": 0.522183 + } + ], + "main_score": 0.5039, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 15.23106861114502, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/FEVER.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/FEVER.json new file mode 100644 index 0000000000..8f60f1c0ca --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/FEVER.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "bea83ef9e8fb933d90a2f1d5515737465d613e12", + "task_name": "FEVER", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.93054, + "ndcg_at_3": 0.93305, + "ndcg_at_5": 0.93648, + "ndcg_at_10": 0.93975, + "ndcg_at_20": 0.94189, + "ndcg_at_100": 0.94421, + "ndcg_at_1000": 0.94598, + "map_at_1": 0.86453, + "map_at_3": 0.91117, + "map_at_5": 0.91532, + "map_at_10": 0.9178, + "map_at_20": 0.91883, + "map_at_100": 0.91941, + "map_at_1000": 0.91952, + "recall_at_1": 0.86453, + "recall_at_3": 0.94423, + "recall_at_5": 0.95432, + "recall_at_10": 0.96356, + "recall_at_20": 0.96991, + "recall_at_100": 0.97913, + "recall_at_1000": 0.98955, + "precision_at_1": 0.93054, + "precision_at_3": 0.34653, + "precision_at_5": 0.212, + "precision_at_10": 0.10821, + "precision_at_20": 0.05496, + "precision_at_100": 0.01126, + "precision_at_1000": 0.00116, + "mrr_at_1": 0.930543, + "mrr_at_3": 0.960946, + "mrr_at_5": 0.961786, + "mrr_at_10": 0.962055, + "mrr_at_20": 0.962077, + "mrr_at_100": 0.962086, + "mrr_at_1000": 0.962088, + "nauc_ndcg_at_1_max": 0.252083, + "nauc_ndcg_at_1_std": -0.17856, + "nauc_ndcg_at_1_diff1": 0.85128, + "nauc_ndcg_at_3_max": 0.161453, + "nauc_ndcg_at_3_std": -0.027748, + "nauc_ndcg_at_3_diff1": 0.448335, + "nauc_ndcg_at_5_max": 0.164521, + "nauc_ndcg_at_5_std": -0.015049, + "nauc_ndcg_at_5_diff1": 0.429626, + "nauc_ndcg_at_10_max": 0.166731, + "nauc_ndcg_at_10_std": 1e-06, + "nauc_ndcg_at_10_diff1": 0.424544, + "nauc_ndcg_at_20_max": 0.171676, + "nauc_ndcg_at_20_std": 0.00221, + "nauc_ndcg_at_20_diff1": 0.436716, + "nauc_ndcg_at_100_max": 0.179397, + "nauc_ndcg_at_100_std": 0.003518, + "nauc_ndcg_at_100_diff1": 0.448508, + "nauc_ndcg_at_1000_max": 0.185414, + "nauc_ndcg_at_1000_std": -0.003267, + "nauc_ndcg_at_1000_diff1": 0.463582, + "nauc_map_at_1_max": 0.161669, + "nauc_map_at_1_std": -0.069106, + "nauc_map_at_1_diff1": 0.535154, + "nauc_map_at_3_max": 0.151188, + "nauc_map_at_3_std": -0.025756, + "nauc_map_at_3_diff1": 0.427854, + "nauc_map_at_5_max": 0.156808, + "nauc_map_at_5_std": -0.020649, + "nauc_map_at_5_diff1": 0.426272, + "nauc_map_at_10_max": 0.160198, + "nauc_map_at_10_std": -0.013874, + "nauc_map_at_10_diff1": 0.427453, + "nauc_map_at_20_max": 0.162157, + "nauc_map_at_20_std": -0.012885, + "nauc_map_at_20_diff1": 0.431304, + "nauc_map_at_100_max": 0.163932, + "nauc_map_at_100_std": -0.012345, + "nauc_map_at_100_diff1": 0.43338, + "nauc_map_at_1000_max": 0.164221, + "nauc_map_at_1000_std": -0.012522, + "nauc_map_at_1000_diff1": 0.433935, + "nauc_recall_at_1_max": 0.161669, + "nauc_recall_at_1_std": -0.069106, + "nauc_recall_at_1_diff1": 0.535154, + "nauc_recall_at_3_max": 0.089685, + "nauc_recall_at_3_std": 0.076678, + "nauc_recall_at_3_diff1": 0.175045, + "nauc_recall_at_5_max": 0.11359, + "nauc_recall_at_5_std": 0.134785, + "nauc_recall_at_5_diff1": 0.102669, + "nauc_recall_at_10_max": 0.121499, + "nauc_recall_at_10_std": 0.227543, + "nauc_recall_at_10_diff1": 0.029265, + "nauc_recall_at_20_max": 0.142036, + "nauc_recall_at_20_std": 0.285153, + "nauc_recall_at_20_diff1": 0.022343, + "nauc_recall_at_100_max": 0.187474, + "nauc_recall_at_100_std": 0.409635, + "nauc_recall_at_100_diff1": -0.037421, + "nauc_recall_at_1000_max": 0.357464, + "nauc_recall_at_1000_std": 0.59188, + "nauc_recall_at_1000_diff1": -0.088234, + "nauc_precision_at_1_max": 0.252083, + "nauc_precision_at_1_std": -0.17856, + "nauc_precision_at_1_diff1": 0.85128, + "nauc_precision_at_3_max": -0.009028, + "nauc_precision_at_3_std": 0.024311, + "nauc_precision_at_3_diff1": -0.155788, + "nauc_precision_at_5_max": -0.013704, + "nauc_precision_at_5_std": 0.033588, + "nauc_precision_at_5_diff1": -0.192581, + "nauc_precision_at_10_max": -0.012697, + "nauc_precision_at_10_std": 0.054479, + "nauc_precision_at_10_diff1": -0.193508, + "nauc_precision_at_20_max": -0.011103, + "nauc_precision_at_20_std": 0.05196, + "nauc_precision_at_20_diff1": -0.167918, + "nauc_precision_at_100_max": 0.007296, + "nauc_precision_at_100_std": 0.051753, + "nauc_precision_at_100_diff1": -0.140287, + "nauc_precision_at_1000_max": 0.012832, + "nauc_precision_at_1000_std": 0.020066, + "nauc_precision_at_1000_diff1": -0.102397, + "nauc_mrr_at_1_max": 0.252083, + "nauc_mrr_at_1_std": -0.17856, + "nauc_mrr_at_1_diff1": 0.85128, + "nauc_mrr_at_3_max": 0.237393, + "nauc_mrr_at_3_std": -0.198359, + "nauc_mrr_at_3_diff1": 0.845402, + "nauc_mrr_at_5_max": 0.246728, + "nauc_mrr_at_5_std": -0.191389, + "nauc_mrr_at_5_diff1": 0.845652, + "nauc_mrr_at_10_max": 0.246154, + "nauc_mrr_at_10_std": -0.189248, + "nauc_mrr_at_10_diff1": 0.8453, + "nauc_mrr_at_20_max": 0.246711, + "nauc_mrr_at_20_std": -0.188846, + "nauc_mrr_at_20_diff1": 0.845634, + "nauc_mrr_at_100_max": 0.246527, + "nauc_mrr_at_100_std": -0.189125, + "nauc_mrr_at_100_diff1": 0.845692, + "nauc_mrr_at_1000_max": 0.246513, + "nauc_mrr_at_1000_std": -0.189163, + "nauc_mrr_at_1000_diff1": 0.84569, + "main_score": 0.93975, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 824.7792942523956, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/FiQA2018.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/FiQA2018.json new file mode 100644 index 0000000000..11bf499508 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/FiQA2018.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "27a168819829fe9bcd655c2df245fb19452e8e06", + "task_name": "FiQA2018", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.47994, + "ndcg_at_3": 0.45003, + "ndcg_at_5": 0.46467, + "ndcg_at_10": 0.49542, + "ndcg_at_20": 0.52347, + "ndcg_at_100": 0.56426, + "ndcg_at_1000": 0.58584, + "map_at_1": 0.24184, + "map_at_3": 0.34896, + "map_at_5": 0.38017, + "map_at_10": 0.40433, + "map_at_20": 0.41599, + "map_at_100": 0.42546, + "map_at_1000": 0.42697, + "recall_at_1": 0.24184, + "recall_at_3": 0.41532, + "recall_at_5": 0.48691, + "recall_at_10": 0.58282, + "recall_at_20": 0.66892, + "recall_at_100": 0.83285, + "recall_at_1000": 0.95643, + "precision_at_1": 0.47994, + "precision_at_3": 0.30041, + "precision_at_5": 0.22222, + "precision_at_10": 0.13812, + "precision_at_20": 0.08102, + "precision_at_100": 0.0209, + "precision_at_1000": 0.0025, + "mrr_at_1": 0.479938, + "mrr_at_3": 0.557613, + "mrr_at_5": 0.571116, + "mrr_at_10": 0.581197, + "mrr_at_20": 0.584965, + "mrr_at_100": 0.587569, + "mrr_at_1000": 0.587761, + "nauc_ndcg_at_1_max": 0.487468, + "nauc_ndcg_at_1_std": -0.042375, + "nauc_ndcg_at_1_diff1": 0.564762, + "nauc_ndcg_at_3_max": 0.400522, + "nauc_ndcg_at_3_std": -0.045477, + "nauc_ndcg_at_3_diff1": 0.415273, + "nauc_ndcg_at_5_max": 0.38792, + "nauc_ndcg_at_5_std": -0.050248, + "nauc_ndcg_at_5_diff1": 0.409163, + "nauc_ndcg_at_10_max": 0.389776, + "nauc_ndcg_at_10_std": -0.043409, + "nauc_ndcg_at_10_diff1": 0.417032, + "nauc_ndcg_at_20_max": 0.410843, + "nauc_ndcg_at_20_std": -0.021178, + "nauc_ndcg_at_20_diff1": 0.429348, + "nauc_ndcg_at_100_max": 0.424812, + "nauc_ndcg_at_100_std": -0.00632, + "nauc_ndcg_at_100_diff1": 0.434032, + "nauc_ndcg_at_1000_max": 0.430017, + "nauc_ndcg_at_1000_std": -0.006675, + "nauc_ndcg_at_1000_diff1": 0.439787, + "nauc_map_at_1_max": 0.253001, + "nauc_map_at_1_std": -0.093826, + "nauc_map_at_1_diff1": 0.516075, + "nauc_map_at_3_max": 0.312477, + "nauc_map_at_3_std": -0.083247, + "nauc_map_at_3_diff1": 0.430323, + "nauc_map_at_5_max": 0.339702, + "nauc_map_at_5_std": -0.07602, + "nauc_map_at_5_diff1": 0.414358, + "nauc_map_at_10_max": 0.360823, + "nauc_map_at_10_std": -0.067534, + "nauc_map_at_10_diff1": 0.413072, + "nauc_map_at_20_max": 0.371663, + "nauc_map_at_20_std": -0.057726, + "nauc_map_at_20_diff1": 0.417666, + "nauc_map_at_100_max": 0.377222, + "nauc_map_at_100_std": -0.052574, + "nauc_map_at_100_diff1": 0.419008, + "nauc_map_at_1000_max": 0.378021, + "nauc_map_at_1000_std": -0.052259, + "nauc_map_at_1000_diff1": 0.419534, + "nauc_recall_at_1_max": 0.253001, + "nauc_recall_at_1_std": -0.093826, + "nauc_recall_at_1_diff1": 0.516075, + "nauc_recall_at_3_max": 0.244207, + "nauc_recall_at_3_std": -0.081759, + "nauc_recall_at_3_diff1": 0.318741, + "nauc_recall_at_5_max": 0.266177, + "nauc_recall_at_5_std": -0.069537, + "nauc_recall_at_5_diff1": 0.286688, + "nauc_recall_at_10_max": 0.277053, + "nauc_recall_at_10_std": -0.047031, + "nauc_recall_at_10_diff1": 0.281842, + "nauc_recall_at_20_max": 0.324738, + "nauc_recall_at_20_std": 0.024561, + "nauc_recall_at_20_diff1": 0.301725, + "nauc_recall_at_100_max": 0.326635, + "nauc_recall_at_100_std": 0.127048, + "nauc_recall_at_100_diff1": 0.255138, + "nauc_recall_at_1000_max": 0.351364, + "nauc_recall_at_1000_std": 0.287146, + "nauc_recall_at_1000_diff1": 0.260137, + "nauc_precision_at_1_max": 0.487468, + "nauc_precision_at_1_std": -0.042375, + "nauc_precision_at_1_diff1": 0.564762, + "nauc_precision_at_3_max": 0.433288, + "nauc_precision_at_3_std": 0.016228, + "nauc_precision_at_3_diff1": 0.213604, + "nauc_precision_at_5_max": 0.431518, + "nauc_precision_at_5_std": 0.047605, + "nauc_precision_at_5_diff1": 0.142611, + "nauc_precision_at_10_max": 0.435286, + "nauc_precision_at_10_std": 0.097062, + "nauc_precision_at_10_diff1": 0.101759, + "nauc_precision_at_20_max": 0.414498, + "nauc_precision_at_20_std": 0.148533, + "nauc_precision_at_20_diff1": 0.082728, + "nauc_precision_at_100_max": 0.354594, + "nauc_precision_at_100_std": 0.182305, + "nauc_precision_at_100_diff1": 0.028412, + "nauc_precision_at_1000_max": 0.276594, + "nauc_precision_at_1000_std": 0.178554, + "nauc_precision_at_1000_diff1": -0.023887, + "nauc_mrr_at_1_max": 0.487468, + "nauc_mrr_at_1_std": -0.042375, + "nauc_mrr_at_1_diff1": 0.564762, + "nauc_mrr_at_3_max": 0.470286, + "nauc_mrr_at_3_std": -0.014574, + "nauc_mrr_at_3_diff1": 0.511183, + "nauc_mrr_at_5_max": 0.474527, + "nauc_mrr_at_5_std": -0.008493, + "nauc_mrr_at_5_diff1": 0.509085, + "nauc_mrr_at_10_max": 0.477689, + "nauc_mrr_at_10_std": -0.003375, + "nauc_mrr_at_10_diff1": 0.510834, + "nauc_mrr_at_20_max": 0.480061, + "nauc_mrr_at_20_std": -0.001552, + "nauc_mrr_at_20_diff1": 0.51248, + "nauc_mrr_at_100_max": 0.479843, + "nauc_mrr_at_100_std": -0.002465, + "nauc_mrr_at_100_diff1": 0.513004, + "nauc_mrr_at_1000_max": 0.479753, + "nauc_mrr_at_1000_std": -0.002578, + "nauc_mrr_at_1000_diff1": 0.513045, + "main_score": 0.49542, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 6.909597635269165, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/HotpotQA.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/HotpotQA.json new file mode 100644 index 0000000000..921e4dade1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/HotpotQA.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "ab518f4d6fcca38d87c25209f94beba119d02014", + "task_name": "HotpotQA", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.85064, + "ndcg_at_3": 0.66717, + "ndcg_at_5": 0.68731, + "ndcg_at_10": 0.70391, + "ndcg_at_20": 0.71419, + "ndcg_at_100": 0.72954, + "ndcg_at_1000": 0.74157, + "map_at_1": 0.42532, + "map_at_3": 0.58985, + "map_at_5": 0.60645, + "map_at_10": 0.61663, + "map_at_20": 0.6208, + "map_at_100": 0.62401, + "map_at_1000": 0.62462, + "recall_at_1": 0.42532, + "recall_at_3": 0.62336, + "recall_at_5": 0.663, + "recall_at_10": 0.70452, + "recall_at_20": 0.73747, + "recall_at_100": 0.80533, + "recall_at_1000": 0.88562, + "precision_at_1": 0.85064, + "precision_at_3": 0.41558, + "precision_at_5": 0.2652, + "precision_at_10": 0.1409, + "precision_at_20": 0.07375, + "precision_at_100": 0.01611, + "precision_at_1000": 0.00177, + "mrr_at_1": 0.850641, + "mrr_at_3": 0.886023, + "mrr_at_5": 0.889507, + "mrr_at_10": 0.891734, + "mrr_at_20": 0.892723, + "mrr_at_100": 0.89314, + "mrr_at_1000": 0.893186, + "nauc_ndcg_at_1_max": 0.508573, + "nauc_ndcg_at_1_std": -0.082507, + "nauc_ndcg_at_1_diff1": 0.76269, + "nauc_ndcg_at_3_max": 0.143085, + "nauc_ndcg_at_3_std": 0.047004, + "nauc_ndcg_at_3_diff1": 0.138316, + "nauc_ndcg_at_5_max": 0.135109, + "nauc_ndcg_at_5_std": 0.068896, + "nauc_ndcg_at_5_diff1": 0.121147, + "nauc_ndcg_at_10_max": 0.129243, + "nauc_ndcg_at_10_std": 0.089594, + "nauc_ndcg_at_10_diff1": 0.107384, + "nauc_ndcg_at_20_max": 0.123969, + "nauc_ndcg_at_20_std": 0.100946, + "nauc_ndcg_at_20_diff1": 0.100086, + "nauc_ndcg_at_100_max": 0.123911, + "nauc_ndcg_at_100_std": 0.114712, + "nauc_ndcg_at_100_diff1": 0.100366, + "nauc_ndcg_at_1000_max": 0.131387, + "nauc_ndcg_at_1000_std": 0.114139, + "nauc_ndcg_at_1000_diff1": 0.108551, + "nauc_map_at_1_max": 0.508573, + "nauc_map_at_1_std": -0.082507, + "nauc_map_at_1_diff1": 0.76269, + "nauc_map_at_3_max": 0.093608, + "nauc_map_at_3_std": 0.051481, + "nauc_map_at_3_diff1": 0.073044, + "nauc_map_at_5_max": 0.090193, + "nauc_map_at_5_std": 0.066773, + "nauc_map_at_5_diff1": 0.063833, + "nauc_map_at_10_max": 0.088694, + "nauc_map_at_10_std": 0.077668, + "nauc_map_at_10_diff1": 0.058634, + "nauc_map_at_20_max": 0.087624, + "nauc_map_at_20_std": 0.081611, + "nauc_map_at_20_diff1": 0.056997, + "nauc_map_at_100_max": 0.08785, + "nauc_map_at_100_std": 0.08411, + "nauc_map_at_100_diff1": 0.057292, + "nauc_map_at_1000_max": 0.088087, + "nauc_map_at_1000_std": 0.084132, + "nauc_map_at_1000_diff1": 0.057518, + "nauc_recall_at_1_max": 0.508573, + "nauc_recall_at_1_std": -0.082507, + "nauc_recall_at_1_diff1": 0.76269, + "nauc_recall_at_3_max": 0.061538, + "nauc_recall_at_3_std": 0.080613, + "nauc_recall_at_3_diff1": 0.00021, + "nauc_recall_at_5_max": 0.042994, + "nauc_recall_at_5_std": 0.118279, + "nauc_recall_at_5_diff1": -0.034948, + "nauc_recall_at_10_max": 0.023206, + "nauc_recall_at_10_std": 0.16692, + "nauc_recall_at_10_diff1": -0.075879, + "nauc_recall_at_20_max": -0.000814, + "nauc_recall_at_20_std": 0.203607, + "nauc_recall_at_20_diff1": -0.110207, + "nauc_recall_at_100_max": -0.027256, + "nauc_recall_at_100_std": 0.286499, + "nauc_recall_at_100_diff1": -0.151039, + "nauc_recall_at_1000_max": -0.018936, + "nauc_recall_at_1000_std": 0.365426, + "nauc_recall_at_1000_diff1": -0.184487, + "nauc_precision_at_1_max": 0.508573, + "nauc_precision_at_1_std": -0.082507, + "nauc_precision_at_1_diff1": 0.76269, + "nauc_precision_at_3_max": 0.061538, + "nauc_precision_at_3_std": 0.080613, + "nauc_precision_at_3_diff1": 0.00021, + "nauc_precision_at_5_max": 0.042994, + "nauc_precision_at_5_std": 0.118279, + "nauc_precision_at_5_diff1": -0.034948, + "nauc_precision_at_10_max": 0.023206, + "nauc_precision_at_10_std": 0.16692, + "nauc_precision_at_10_diff1": -0.075879, + "nauc_precision_at_20_max": -0.000814, + "nauc_precision_at_20_std": 0.203607, + "nauc_precision_at_20_diff1": -0.110207, + "nauc_precision_at_100_max": -0.027256, + "nauc_precision_at_100_std": 0.286499, + "nauc_precision_at_100_diff1": -0.151039, + "nauc_precision_at_1000_max": -0.018936, + "nauc_precision_at_1000_std": 0.365426, + "nauc_precision_at_1000_diff1": -0.184487, + "nauc_mrr_at_1_max": 0.508573, + "nauc_mrr_at_1_std": -0.082507, + "nauc_mrr_at_1_diff1": 0.76269, + "nauc_mrr_at_3_max": 0.551033, + "nauc_mrr_at_3_std": -0.060482, + "nauc_mrr_at_3_diff1": 0.760133, + "nauc_mrr_at_5_max": 0.550519, + "nauc_mrr_at_5_std": -0.05638, + "nauc_mrr_at_5_diff1": 0.760237, + "nauc_mrr_at_10_max": 0.550312, + "nauc_mrr_at_10_std": -0.054272, + "nauc_mrr_at_10_diff1": 0.760893, + "nauc_mrr_at_20_max": 0.548681, + "nauc_mrr_at_20_std": -0.054868, + "nauc_mrr_at_20_diff1": 0.760881, + "nauc_mrr_at_100_max": 0.548329, + "nauc_mrr_at_100_std": -0.054955, + "nauc_mrr_at_100_diff1": 0.76083, + "nauc_mrr_at_1000_max": 0.548222, + "nauc_mrr_at_1000_std": -0.055147, + "nauc_mrr_at_1000_diff1": 0.760816, + "main_score": 0.70391, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 774.9631609916687, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ImdbClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ImdbClassification.json new file mode 100644 index 0000000000..387c35d0d1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ImdbClassification.json @@ -0,0 +1,95 @@ +{ + "dataset_revision": "3d86128a09e091d6018b6d26cad27f2739fc2db7", + "task_name": "ImdbClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.8714, + "f1": 0.870781, + "f1_weighted": 0.870781, + "ap": 0.821529, + "ap_weighted": 0.821529, + "scores_per_experiment": [ + { + "accuracy": 0.86032, + "f1": 0.859256, + "f1_weighted": 0.859256, + "ap": 0.837325, + "ap_weighted": 0.837325 + }, + { + "accuracy": 0.87096, + "f1": 0.870376, + "f1_weighted": 0.870376, + "ap": 0.844429, + "ap_weighted": 0.844429 + }, + { + "accuracy": 0.88648, + "f1": 0.886234, + "f1_weighted": 0.886234, + "ap": 0.829903, + "ap_weighted": 0.829903 + }, + { + "accuracy": 0.89784, + "f1": 0.897813, + "f1_weighted": 0.897813, + "ap": 0.862537, + "ap_weighted": 0.862537 + }, + { + "accuracy": 0.90376, + "f1": 0.903705, + "f1_weighted": 0.903705, + "ap": 0.857459, + "ap_weighted": 0.857459 + }, + { + "accuracy": 0.88496, + "f1": 0.884895, + "f1_weighted": 0.884895, + "ap": 0.83393, + "ap_weighted": 0.83393 + }, + { + "accuracy": 0.88176, + "f1": 0.881582, + "f1_weighted": 0.881582, + "ap": 0.826146, + "ap_weighted": 0.826146 + }, + { + "accuracy": 0.8432, + "f1": 0.841572, + "f1_weighted": 0.841572, + "ap": 0.769533, + "ap_weighted": 0.769533 + }, + { + "accuracy": 0.8168, + "f1": 0.81452, + "f1_weighted": 0.81452, + "ap": 0.740546, + "ap_weighted": 0.740546 + }, + { + "accuracy": 0.86792, + "f1": 0.867853, + "f1_weighted": 0.867853, + "ap": 0.813481, + "ap_weighted": 0.813481 + } + ], + "main_score": 0.8714, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 11.841211318969727, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MSMARCO.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MSMARCO.json new file mode 100644 index 0000000000..d676edac60 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MSMARCO.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "c5a29a104738b98a9e76336939199e264163d4a0", + "task_name": "MSMARCO", + "mteb_version": "1.29.7", + "scores": { + "dev": [ + { + "ndcg_at_1": 0.21662, + "ndcg_at_3": 0.31891, + "ndcg_at_5": 0.36046, + "ndcg_at_10": 0.39927, + "ndcg_at_20": 0.42792, + "ndcg_at_100": 0.45915, + "ndcg_at_1000": 0.47172, + "map_at_1": 0.21112, + "map_at_3": 0.29111, + "map_at_5": 0.31437, + "map_at_10": 0.33072, + "map_at_20": 0.33882, + "map_at_100": 0.34334, + "map_at_1000": 0.34385, + "recall_at_1": 0.21112, + "recall_at_3": 0.39325, + "recall_at_5": 0.49306, + "recall_at_10": 0.61091, + "recall_at_20": 0.72178, + "recall_at_100": 0.88583, + "recall_at_1000": 0.98169, + "precision_at_1": 0.21662, + "precision_at_3": 0.13572, + "precision_at_5": 0.10258, + "precision_at_10": 0.06383, + "precision_at_20": 0.03789, + "precision_at_100": 0.00936, + "precision_at_1000": 0.00104, + "mrr_at_1": 0.216619, + "mrr_at_3": 0.297326, + "mrr_at_5": 0.320313, + "mrr_at_10": 0.336254, + "mrr_at_20": 0.344054, + "mrr_at_100": 0.348309, + "mrr_at_1000": 0.348762, + "nauc_ndcg_at_1_max": 0.043226, + "nauc_ndcg_at_1_std": -0.218788, + "nauc_ndcg_at_1_diff1": 0.351115, + "nauc_ndcg_at_3_max": 0.05556, + "nauc_ndcg_at_3_std": -0.244843, + "nauc_ndcg_at_3_diff1": 0.308127, + "nauc_ndcg_at_5_max": 0.065988, + "nauc_ndcg_at_5_std": -0.24563, + "nauc_ndcg_at_5_diff1": 0.307405, + "nauc_ndcg_at_10_max": 0.071935, + "nauc_ndcg_at_10_std": -0.242307, + "nauc_ndcg_at_10_diff1": 0.304748, + "nauc_ndcg_at_20_max": 0.080072, + "nauc_ndcg_at_20_std": -0.227504, + "nauc_ndcg_at_20_diff1": 0.307236, + "nauc_ndcg_at_100_max": 0.081841, + "nauc_ndcg_at_100_std": -0.208209, + "nauc_ndcg_at_100_diff1": 0.308025, + "nauc_ndcg_at_1000_max": 0.076037, + "nauc_ndcg_at_1000_std": -0.217613, + "nauc_ndcg_at_1000_diff1": 0.310597, + "nauc_map_at_1_max": 0.043461, + "nauc_map_at_1_std": -0.219072, + "nauc_map_at_1_diff1": 0.350199, + "nauc_map_at_3_max": 0.051587, + "nauc_map_at_3_std": -0.240597, + "nauc_map_at_3_diff1": 0.317288, + "nauc_map_at_5_max": 0.057408, + "nauc_map_at_5_std": -0.241635, + "nauc_map_at_5_diff1": 0.316792, + "nauc_map_at_10_max": 0.060121, + "nauc_map_at_10_std": -0.240097, + "nauc_map_at_10_diff1": 0.315906, + "nauc_map_at_20_max": 0.062302, + "nauc_map_at_20_std": -0.236045, + "nauc_map_at_20_diff1": 0.316919, + "nauc_map_at_100_max": 0.062479, + "nauc_map_at_100_std": -0.233313, + "nauc_map_at_100_diff1": 0.317152, + "nauc_map_at_1000_max": 0.062301, + "nauc_map_at_1000_std": -0.233527, + "nauc_map_at_1000_diff1": 0.317253, + "nauc_recall_at_1_max": 0.043461, + "nauc_recall_at_1_std": -0.219072, + "nauc_recall_at_1_diff1": 0.350199, + "nauc_recall_at_3_max": 0.066189, + "nauc_recall_at_3_std": -0.256482, + "nauc_recall_at_3_diff1": 0.283226, + "nauc_recall_at_5_max": 0.090366, + "nauc_recall_at_5_std": -0.255997, + "nauc_recall_at_5_diff1": 0.279833, + "nauc_recall_at_10_max": 0.109374, + "nauc_recall_at_10_std": -0.247349, + "nauc_recall_at_10_diff1": 0.266014, + "nauc_recall_at_20_max": 0.155941, + "nauc_recall_at_20_std": -0.17967, + "nauc_recall_at_20_diff1": 0.266741, + "nauc_recall_at_100_max": 0.262734, + "nauc_recall_at_100_std": 0.107535, + "nauc_recall_at_100_diff1": 0.234186, + "nauc_recall_at_1000_max": 0.51863, + "nauc_recall_at_1000_std": 0.566778, + "nauc_recall_at_1000_diff1": 0.162465, + "nauc_precision_at_1_max": 0.043226, + "nauc_precision_at_1_std": -0.218788, + "nauc_precision_at_1_diff1": 0.351115, + "nauc_precision_at_3_max": 0.065195, + "nauc_precision_at_3_std": -0.254486, + "nauc_precision_at_3_diff1": 0.280604, + "nauc_precision_at_5_max": 0.087787, + "nauc_precision_at_5_std": -0.250698, + "nauc_precision_at_5_diff1": 0.271712, + "nauc_precision_at_10_max": 0.107673, + "nauc_precision_at_10_std": -0.230408, + "nauc_precision_at_10_diff1": 0.250581, + "nauc_precision_at_20_max": 0.14922, + "nauc_precision_at_20_std": -0.143883, + "nauc_precision_at_20_diff1": 0.234929, + "nauc_precision_at_100_max": 0.186436, + "nauc_precision_at_100_std": 0.123126, + "nauc_precision_at_100_diff1": 0.128223, + "nauc_precision_at_1000_max": 0.102971, + "nauc_precision_at_1000_std": 0.16865, + "nauc_precision_at_1000_diff1": -0.023448, + "nauc_mrr_at_1_max": 0.043226, + "nauc_mrr_at_1_std": -0.218788, + "nauc_mrr_at_1_diff1": 0.351115, + "nauc_mrr_at_3_max": 0.051483, + "nauc_mrr_at_3_std": -0.238842, + "nauc_mrr_at_3_diff1": 0.317627, + "nauc_mrr_at_5_max": 0.057273, + "nauc_mrr_at_5_std": -0.239133, + "nauc_mrr_at_5_diff1": 0.317566, + "nauc_mrr_at_10_max": 0.059855, + "nauc_mrr_at_10_std": -0.237414, + "nauc_mrr_at_10_diff1": 0.316637, + "nauc_mrr_at_20_max": 0.061897, + "nauc_mrr_at_20_std": -0.233451, + "nauc_mrr_at_20_diff1": 0.317368, + "nauc_mrr_at_100_max": 0.061924, + "nauc_mrr_at_100_std": -0.23116, + "nauc_mrr_at_100_diff1": 0.317652, + "nauc_mrr_at_1000_max": 0.061728, + "nauc_mrr_at_1000_std": -0.231406, + "nauc_mrr_at_1000_diff1": 0.31777, + "main_score": 0.39927, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 1190.4523539543152, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MTOPDomainClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MTOPDomainClassification.json new file mode 100644 index 0000000000..5b7bfdc159 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MTOPDomainClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "d80d48c1eb48d3562165c59d59d0034df9fff0bf", + "task_name": "MTOPDomainClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.958254, + "f1": 0.954733, + "f1_weighted": 0.958445, + "scores_per_experiment": [ + { + "accuracy": 0.959416, + "f1": 0.955023, + "f1_weighted": 0.959655 + }, + { + "accuracy": 0.96352, + "f1": 0.960773, + "f1_weighted": 0.963638 + }, + { + "accuracy": 0.953944, + "f1": 0.951626, + "f1_weighted": 0.954012 + }, + { + "accuracy": 0.955312, + "f1": 0.950575, + "f1_weighted": 0.955628 + }, + { + "accuracy": 0.955312, + "f1": 0.951043, + "f1_weighted": 0.955476 + }, + { + "accuracy": 0.963292, + "f1": 0.96151, + "f1_weighted": 0.96358 + }, + { + "accuracy": 0.95896, + "f1": 0.953999, + "f1_weighted": 0.958922 + }, + { + "accuracy": 0.956224, + "f1": 0.951864, + "f1_weighted": 0.956457 + }, + { + "accuracy": 0.951892, + "f1": 0.950169, + "f1_weighted": 0.952262 + }, + { + "accuracy": 0.96466, + "f1": 0.960747, + "f1_weighted": 0.964818 + } + ], + "main_score": 0.958254, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 7.660795450210571, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MTOPIntentClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MTOPIntentClassification.json new file mode 100644 index 0000000000..a63ff50e8b --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MTOPIntentClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba", + "task_name": "MTOPIntentClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.811514, + "f1": 0.606791, + "f1_weighted": 0.838505, + "scores_per_experiment": [ + { + "accuracy": 0.817145, + "f1": 0.595502, + "f1_weighted": 0.84378 + }, + { + "accuracy": 0.826265, + "f1": 0.617449, + "f1_weighted": 0.85102 + }, + { + "accuracy": 0.80415, + "f1": 0.603526, + "f1_weighted": 0.834178 + }, + { + "accuracy": 0.80415, + "f1": 0.616834, + "f1_weighted": 0.830996 + }, + { + "accuracy": 0.816917, + "f1": 0.619772, + "f1_weighted": 0.842099 + }, + { + "accuracy": 0.80073, + "f1": 0.589994, + "f1_weighted": 0.828442 + }, + { + "accuracy": 0.817145, + "f1": 0.607429, + "f1_weighted": 0.846354 + }, + { + "accuracy": 0.825581, + "f1": 0.623426, + "f1_weighted": 0.849813 + }, + { + "accuracy": 0.808938, + "f1": 0.616289, + "f1_weighted": 0.840152 + }, + { + "accuracy": 0.794118, + "f1": 0.577688, + "f1_weighted": 0.818221 + } + ], + "main_score": 0.811514, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 14.307345151901245, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MassiveIntentClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MassiveIntentClassification.json new file mode 100644 index 0000000000..69f485ebc1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MassiveIntentClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "4672e20407010da34463acc759c162ca9734bca6", + "task_name": "MassiveIntentClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.751849, + "f1": 0.728146, + "f1_weighted": 0.75029, + "scores_per_experiment": [ + { + "accuracy": 0.758911, + "f1": 0.746919, + "f1_weighted": 0.758839 + }, + { + "accuracy": 0.76967, + "f1": 0.73906, + "f1_weighted": 0.767113 + }, + { + "accuracy": 0.755884, + "f1": 0.725607, + "f1_weighted": 0.748286 + }, + { + "accuracy": 0.765636, + "f1": 0.736946, + "f1_weighted": 0.764232 + }, + { + "accuracy": 0.734701, + "f1": 0.716702, + "f1_weighted": 0.729695 + }, + { + "accuracy": 0.734364, + "f1": 0.717394, + "f1_weighted": 0.733615 + }, + { + "accuracy": 0.748823, + "f1": 0.732443, + "f1_weighted": 0.752166 + }, + { + "accuracy": 0.744116, + "f1": 0.712899, + "f1_weighted": 0.743968 + }, + { + "accuracy": 0.742771, + "f1": 0.715812, + "f1_weighted": 0.740779 + }, + { + "accuracy": 0.763618, + "f1": 0.737677, + "f1_weighted": 0.764204 + } + ], + "main_score": 0.751849, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 10.243975162506104, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MassiveScenarioClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MassiveScenarioClassification.json new file mode 100644 index 0000000000..0fb8a72eee --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MassiveScenarioClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "fad2c6e8459f9e1c45d9315f4953d921437d70f8", + "task_name": "MassiveScenarioClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.789576, + "f1": 0.788001, + "f1_weighted": 0.789665, + "scores_per_experiment": [ + { + "accuracy": 0.794553, + "f1": 0.79381, + "f1_weighted": 0.794574 + }, + { + "accuracy": 0.77774, + "f1": 0.781514, + "f1_weighted": 0.777436 + }, + { + "accuracy": 0.790182, + "f1": 0.784417, + "f1_weighted": 0.789449 + }, + { + "accuracy": 0.788164, + "f1": 0.783719, + "f1_weighted": 0.789268 + }, + { + "accuracy": 0.801278, + "f1": 0.792238, + "f1_weighted": 0.799958 + }, + { + "accuracy": 0.78043, + "f1": 0.779357, + "f1_weighted": 0.779643 + }, + { + "accuracy": 0.76698, + "f1": 0.772057, + "f1_weighted": 0.77167 + }, + { + "accuracy": 0.792535, + "f1": 0.789776, + "f1_weighted": 0.79271 + }, + { + "accuracy": 0.795898, + "f1": 0.795259, + "f1_weighted": 0.794476 + }, + { + "accuracy": 0.808003, + "f1": 0.807865, + "f1_weighted": 0.80747 + } + ], + "main_score": 0.789576, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 8.034817695617676, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MedrxivClusteringP2P.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..a375f4dded --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "task_name": "MedrxivClusteringP2P", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.326735, + "v_measure_std": 0.012048, + "v_measures": [ + 0.306045, + 0.317512, + 0.324717, + 0.317997, + 0.318162, + 0.342185, + 0.329899, + 0.341689, + 0.3443, + 0.324844 + ], + "main_score": 0.326735, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 16.154590368270874, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MedrxivClusteringS2S.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..6ac4d94370 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "task_name": "MedrxivClusteringS2S", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.319117, + "v_measure_std": 0.015943, + "v_measures": [ + 0.31141, + 0.301963, + 0.302396, + 0.294738, + 0.312545, + 0.342561, + 0.322683, + 0.336925, + 0.331054, + 0.334898 + ], + "main_score": 0.319117, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 6.766061305999756, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MindSmallReranking.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MindSmallReranking.json new file mode 100644 index 0000000000..a7e5781bea --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/MindSmallReranking.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "59042f120c80e8afa9cdbb224f67076cec0fc9a7", + "task_name": "MindSmallReranking", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "map": 0.319072, + "mrr": 0.333324, + "nAUC_map_max": -0.162607, + "nAUC_map_std": 0.089198, + "nAUC_map_diff1": 0.19362, + "nAUC_mrr_max": -0.104299, + "nAUC_mrr_std": 0.087359, + "nAUC_mrr_diff1": 0.173349, + "main_score": 0.319072, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 86.28712725639343, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/NFCorpus.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/NFCorpus.json new file mode 100644 index 0000000000..dad5edf310 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/NFCorpus.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "ec0fa4fe99da2ff19ca1214b7966684033a58814", + "task_name": "NFCorpus", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.43653, + "ndcg_at_3": 0.40013, + "ndcg_at_5": 0.37893, + "ndcg_at_10": 0.34322, + "ndcg_at_20": 0.32036, + "ndcg_at_100": 0.31207, + "ndcg_at_1000": 0.40242, + "map_at_1": 0.0501, + "map_at_3": 0.09124, + "map_at_5": 0.10724, + "map_at_10": 0.12477, + "map_at_20": 0.13905, + "map_at_100": 0.15819, + "map_at_1000": 0.17276, + "recall_at_1": 0.0501, + "recall_at_3": 0.10441, + "recall_at_5": 0.13046, + "recall_at_10": 0.16382, + "recall_at_20": 0.2053, + "recall_at_100": 0.31605, + "recall_at_1000": 0.64061, + "precision_at_1": 0.45511, + "precision_at_3": 0.3808, + "precision_at_5": 0.33498, + "precision_at_10": 0.25728, + "precision_at_20": 0.18994, + "precision_at_100": 0.08006, + "precision_at_1000": 0.02111, + "mrr_at_1": 0.455108, + "mrr_at_3": 0.520124, + "mrr_at_5": 0.53483, + "mrr_at_10": 0.541304, + "mrr_at_20": 0.545969, + "mrr_at_100": 0.547988, + "mrr_at_1000": 0.548392, + "nauc_ndcg_at_1_max": 0.545234, + "nauc_ndcg_at_1_std": 0.298372, + "nauc_ndcg_at_1_diff1": 0.335645, + "nauc_ndcg_at_3_max": 0.472261, + "nauc_ndcg_at_3_std": 0.319805, + "nauc_ndcg_at_3_diff1": 0.20545, + "nauc_ndcg_at_5_max": 0.469621, + "nauc_ndcg_at_5_std": 0.335314, + "nauc_ndcg_at_5_diff1": 0.189034, + "nauc_ndcg_at_10_max": 0.4486, + "nauc_ndcg_at_10_std": 0.329173, + "nauc_ndcg_at_10_diff1": 0.165467, + "nauc_ndcg_at_20_max": 0.431118, + "nauc_ndcg_at_20_std": 0.306349, + "nauc_ndcg_at_20_diff1": 0.179662, + "nauc_ndcg_at_100_max": 0.46171, + "nauc_ndcg_at_100_std": 0.315965, + "nauc_ndcg_at_100_diff1": 0.215357, + "nauc_ndcg_at_1000_max": 0.517896, + "nauc_ndcg_at_1000_std": 0.36524, + "nauc_ndcg_at_1000_diff1": 0.222831, + "nauc_map_at_1_max": 0.227167, + "nauc_map_at_1_std": -0.113868, + "nauc_map_at_1_diff1": 0.489197, + "nauc_map_at_3_max": 0.19304, + "nauc_map_at_3_std": -0.074142, + "nauc_map_at_3_diff1": 0.345418, + "nauc_map_at_5_max": 0.229616, + "nauc_map_at_5_std": -0.028081, + "nauc_map_at_5_diff1": 0.313199, + "nauc_map_at_10_max": 0.275933, + "nauc_map_at_10_std": 0.028797, + "nauc_map_at_10_diff1": 0.288555, + "nauc_map_at_20_max": 0.308369, + "nauc_map_at_20_std": 0.074318, + "nauc_map_at_20_diff1": 0.273614, + "nauc_map_at_100_max": 0.341572, + "nauc_map_at_100_std": 0.143824, + "nauc_map_at_100_diff1": 0.249925, + "nauc_map_at_1000_max": 0.349018, + "nauc_map_at_1000_std": 0.183159, + "nauc_map_at_1000_diff1": 0.234325, + "nauc_recall_at_1_max": 0.227167, + "nauc_recall_at_1_std": -0.113868, + "nauc_recall_at_1_diff1": 0.489197, + "nauc_recall_at_3_max": 0.149612, + "nauc_recall_at_3_std": -0.072511, + "nauc_recall_at_3_diff1": 0.276835, + "nauc_recall_at_5_max": 0.171114, + "nauc_recall_at_5_std": -0.019622, + "nauc_recall_at_5_diff1": 0.232889, + "nauc_recall_at_10_max": 0.207084, + "nauc_recall_at_10_std": 0.031663, + "nauc_recall_at_10_diff1": 0.213438, + "nauc_recall_at_20_max": 0.24863, + "nauc_recall_at_20_std": 0.060787, + "nauc_recall_at_20_diff1": 0.235668, + "nauc_recall_at_100_max": 0.291143, + "nauc_recall_at_100_std": 0.187496, + "nauc_recall_at_100_diff1": 0.164727, + "nauc_recall_at_1000_max": 0.221802, + "nauc_recall_at_1000_std": 0.178852, + "nauc_recall_at_1000_diff1": 0.08906, + "nauc_precision_at_1_max": 0.554973, + "nauc_precision_at_1_std": 0.308551, + "nauc_precision_at_1_diff1": 0.325478, + "nauc_precision_at_3_max": 0.454757, + "nauc_precision_at_3_std": 0.364839, + "nauc_precision_at_3_diff1": 0.095995, + "nauc_precision_at_5_max": 0.45189, + "nauc_precision_at_5_std": 0.408373, + "nauc_precision_at_5_diff1": 0.053687, + "nauc_precision_at_10_max": 0.41768, + "nauc_precision_at_10_std": 0.432962, + "nauc_precision_at_10_diff1": -0.02111, + "nauc_precision_at_20_max": 0.358643, + "nauc_precision_at_20_std": 0.452243, + "nauc_precision_at_20_diff1": -0.057548, + "nauc_precision_at_100_max": 0.216903, + "nauc_precision_at_100_std": 0.468247, + "nauc_precision_at_100_diff1": -0.118372, + "nauc_precision_at_1000_max": 0.063224, + "nauc_precision_at_1000_std": 0.371183, + "nauc_precision_at_1000_diff1": -0.144972, + "nauc_mrr_at_1_max": 0.554973, + "nauc_mrr_at_1_std": 0.308551, + "nauc_mrr_at_1_diff1": 0.325478, + "nauc_mrr_at_3_max": 0.547941, + "nauc_mrr_at_3_std": 0.340974, + "nauc_mrr_at_3_diff1": 0.287223, + "nauc_mrr_at_5_max": 0.551404, + "nauc_mrr_at_5_std": 0.35061, + "nauc_mrr_at_5_diff1": 0.289225, + "nauc_mrr_at_10_max": 0.555271, + "nauc_mrr_at_10_std": 0.355494, + "nauc_mrr_at_10_diff1": 0.292475, + "nauc_mrr_at_20_max": 0.560473, + "nauc_mrr_at_20_std": 0.355526, + "nauc_mrr_at_20_diff1": 0.29785, + "nauc_mrr_at_100_max": 0.560596, + "nauc_mrr_at_100_std": 0.355326, + "nauc_mrr_at_100_diff1": 0.298412, + "nauc_mrr_at_1000_max": 0.560283, + "nauc_mrr_at_1000_std": 0.35501, + "nauc_mrr_at_1000_diff1": 0.29835, + "main_score": 0.34322, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 1.5563993453979492, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/NQ.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/NQ.json new file mode 100644 index 0000000000..418257a94c --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/NQ.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "b774495ed302d8c44a3a7ea25c90dbce03968f31", + "task_name": "NQ", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.36645, + "ndcg_at_3": 0.47927, + "ndcg_at_5": 0.52574, + "ndcg_at_10": 0.56103, + "ndcg_at_20": 0.58166, + "ndcg_at_100": 0.60271, + "ndcg_at_1000": 0.6078, + "map_at_1": 0.32537, + "map_at_3": 0.43959, + "map_at_5": 0.46772, + "map_at_10": 0.48393, + "map_at_20": 0.49042, + "map_at_100": 0.49391, + "map_at_1000": 0.49415, + "recall_at_1": 0.32537, + "recall_at_3": 0.56163, + "recall_at_5": 0.6686, + "recall_at_10": 0.77059, + "recall_at_20": 0.84671, + "recall_at_100": 0.95133, + "recall_at_1000": 0.98846, + "precision_at_1": 0.36645, + "precision_at_3": 0.21852, + "precision_at_5": 0.15788, + "precision_at_10": 0.09206, + "precision_at_20": 0.051, + "precision_at_100": 0.01154, + "precision_at_1000": 0.0012, + "mrr_at_1": 0.366744, + "mrr_at_3": 0.471514, + "mrr_at_5": 0.494993, + "mrr_at_10": 0.507977, + "mrr_at_20": 0.512692, + "mrr_at_100": 0.515234, + "mrr_at_1000": 0.515385, + "nauc_ndcg_at_1_max": 0.189226, + "nauc_ndcg_at_1_std": -0.036295, + "nauc_ndcg_at_1_diff1": 0.373257, + "nauc_ndcg_at_3_max": 0.223289, + "nauc_ndcg_at_3_std": -0.024796, + "nauc_ndcg_at_3_diff1": 0.326934, + "nauc_ndcg_at_5_max": 0.237028, + "nauc_ndcg_at_5_std": -0.011018, + "nauc_ndcg_at_5_diff1": 0.325501, + "nauc_ndcg_at_10_max": 0.244799, + "nauc_ndcg_at_10_std": 0.000379, + "nauc_ndcg_at_10_diff1": 0.326484, + "nauc_ndcg_at_20_max": 0.2461, + "nauc_ndcg_at_20_std": 0.009214, + "nauc_ndcg_at_20_diff1": 0.326888, + "nauc_ndcg_at_100_max": 0.242681, + "nauc_ndcg_at_100_std": 0.010186, + "nauc_ndcg_at_100_diff1": 0.330203, + "nauc_ndcg_at_1000_max": 0.237073, + "nauc_ndcg_at_1000_std": 0.002785, + "nauc_ndcg_at_1000_diff1": 0.331759, + "nauc_map_at_1_max": 0.180555, + "nauc_map_at_1_std": -0.055552, + "nauc_map_at_1_diff1": 0.375201, + "nauc_map_at_3_max": 0.215202, + "nauc_map_at_3_std": -0.034859, + "nauc_map_at_3_diff1": 0.339014, + "nauc_map_at_5_max": 0.222429, + "nauc_map_at_5_std": -0.025567, + "nauc_map_at_5_diff1": 0.337601, + "nauc_map_at_10_max": 0.225438, + "nauc_map_at_10_std": -0.020475, + "nauc_map_at_10_diff1": 0.338005, + "nauc_map_at_20_max": 0.225626, + "nauc_map_at_20_std": -0.017893, + "nauc_map_at_20_diff1": 0.338339, + "nauc_map_at_100_max": 0.225058, + "nauc_map_at_100_std": -0.017815, + "nauc_map_at_100_diff1": 0.338803, + "nauc_map_at_1000_max": 0.22487, + "nauc_map_at_1000_std": -0.018038, + "nauc_map_at_1000_diff1": 0.338863, + "nauc_recall_at_1_max": 0.180555, + "nauc_recall_at_1_std": -0.055552, + "nauc_recall_at_1_diff1": 0.375201, + "nauc_recall_at_3_max": 0.243333, + "nauc_recall_at_3_std": -0.014221, + "nauc_recall_at_3_diff1": 0.285468, + "nauc_recall_at_5_max": 0.28366, + "nauc_recall_at_5_std": 0.020442, + "nauc_recall_at_5_diff1": 0.275899, + "nauc_recall_at_10_max": 0.329763, + "nauc_recall_at_10_std": 0.073888, + "nauc_recall_at_10_diff1": 0.265756, + "nauc_recall_at_20_max": 0.375217, + "nauc_recall_at_20_std": 0.159887, + "nauc_recall_at_20_diff1": 0.247389, + "nauc_recall_at_100_max": 0.565202, + "nauc_recall_at_100_std": 0.467924, + "nauc_recall_at_100_diff1": 0.218389, + "nauc_recall_at_1000_max": 0.711546, + "nauc_recall_at_1000_std": 0.706281, + "nauc_recall_at_1000_diff1": 0.148605, + "nauc_precision_at_1_max": 0.189226, + "nauc_precision_at_1_std": -0.036295, + "nauc_precision_at_1_diff1": 0.373257, + "nauc_precision_at_3_max": 0.219783, + "nauc_precision_at_3_std": 0.029921, + "nauc_precision_at_3_diff1": 0.22453, + "nauc_precision_at_5_max": 0.215101, + "nauc_precision_at_5_std": 0.072679, + "nauc_precision_at_5_diff1": 0.16884, + "nauc_precision_at_10_max": 0.198251, + "nauc_precision_at_10_std": 0.118565, + "nauc_precision_at_10_diff1": 0.108838, + "nauc_precision_at_20_max": 0.165984, + "nauc_precision_at_20_std": 0.165576, + "nauc_precision_at_20_diff1": 0.048186, + "nauc_precision_at_100_max": 0.083974, + "nauc_precision_at_100_std": 0.194311, + "nauc_precision_at_100_diff1": -0.043856, + "nauc_precision_at_1000_max": 0.011485, + "nauc_precision_at_1000_std": 0.143047, + "nauc_precision_at_1000_diff1": -0.081105, + "nauc_mrr_at_1_max": 0.190135, + "nauc_mrr_at_1_std": -0.036876, + "nauc_mrr_at_1_diff1": 0.372394, + "nauc_mrr_at_3_max": 0.212892, + "nauc_mrr_at_3_std": -0.015873, + "nauc_mrr_at_3_diff1": 0.335751, + "nauc_mrr_at_5_max": 0.219635, + "nauc_mrr_at_5_std": -0.011093, + "nauc_mrr_at_5_diff1": 0.33665, + "nauc_mrr_at_10_max": 0.221534, + "nauc_mrr_at_10_std": -0.009106, + "nauc_mrr_at_10_diff1": 0.338318, + "nauc_mrr_at_20_max": 0.221472, + "nauc_mrr_at_20_std": -0.008005, + "nauc_mrr_at_20_diff1": 0.338608, + "nauc_mrr_at_100_max": 0.220935, + "nauc_mrr_at_100_std": -0.008257, + "nauc_mrr_at_100_diff1": 0.339034, + "nauc_mrr_at_1000_max": 0.220792, + "nauc_mrr_at_1000_std": -0.00846, + "nauc_mrr_at_1000_diff1": 0.339087, + "main_score": 0.56103, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 301.574551820755, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/QuoraRetrieval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/QuoraRetrieval.json new file mode 100644 index 0000000000..af4934ce6b --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/QuoraRetrieval.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "e4e08e0b7dbe3c8700f0daef558ff32256715259", + "task_name": "QuoraRetrieval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.8119, + "ndcg_at_3": 0.85584, + "ndcg_at_5": 0.87172, + "ndcg_at_10": 0.88565, + "ndcg_at_20": 0.89193, + "ndcg_at_100": 0.8969, + "ndcg_at_1000": 0.89762, + "map_at_1": 0.70587, + "map_at_3": 0.81687, + "map_at_5": 0.83548, + "map_at_10": 0.84732, + "map_at_20": 0.85148, + "map_at_100": 0.85354, + "map_at_1000": 0.85368, + "recall_at_1": 0.70587, + "recall_at_3": 0.87518, + "recall_at_5": 0.91976, + "recall_at_10": 0.95996, + "recall_at_20": 0.97959, + "recall_at_100": 0.99709, + "recall_at_1000": 0.99976, + "precision_at_1": 0.8119, + "precision_at_3": 0.37493, + "precision_at_5": 0.24664, + "precision_at_10": 0.13498, + "precision_at_20": 0.07159, + "precision_at_100": 0.01533, + "precision_at_1000": 0.00157, + "mrr_at_1": 0.8118, + "mrr_at_3": 0.866133, + "mrr_at_5": 0.872698, + "mrr_at_10": 0.876009, + "mrr_at_20": 0.876614, + "mrr_at_100": 0.876837, + "mrr_at_1000": 0.876841, + "nauc_ndcg_at_1_max": 0.412548, + "nauc_ndcg_at_1_std": -0.357265, + "nauc_ndcg_at_1_diff1": 0.765052, + "nauc_ndcg_at_3_max": 0.404704, + "nauc_ndcg_at_3_std": -0.430197, + "nauc_ndcg_at_3_diff1": 0.749998, + "nauc_ndcg_at_5_max": 0.409364, + "nauc_ndcg_at_5_std": -0.440851, + "nauc_ndcg_at_5_diff1": 0.754498, + "nauc_ndcg_at_10_max": 0.410728, + "nauc_ndcg_at_10_std": -0.426508, + "nauc_ndcg_at_10_diff1": 0.753198, + "nauc_ndcg_at_20_max": 0.413008, + "nauc_ndcg_at_20_std": -0.41278, + "nauc_ndcg_at_20_diff1": 0.752466, + "nauc_ndcg_at_100_max": 0.413471, + "nauc_ndcg_at_100_std": -0.398417, + "nauc_ndcg_at_100_diff1": 0.752453, + "nauc_ndcg_at_1000_max": 0.413462, + "nauc_ndcg_at_1000_std": -0.39583, + "nauc_ndcg_at_1000_diff1": 0.751986, + "nauc_map_at_1_max": 0.308198, + "nauc_map_at_1_std": -0.387955, + "nauc_map_at_1_diff1": 0.788882, + "nauc_map_at_3_max": 0.376831, + "nauc_map_at_3_std": -0.453951, + "nauc_map_at_3_diff1": 0.764348, + "nauc_map_at_5_max": 0.390057, + "nauc_map_at_5_std": -0.452229, + "nauc_map_at_5_diff1": 0.762079, + "nauc_map_at_10_max": 0.396286, + "nauc_map_at_10_std": -0.437519, + "nauc_map_at_10_diff1": 0.758105, + "nauc_map_at_20_max": 0.400231, + "nauc_map_at_20_std": -0.425976, + "nauc_map_at_20_diff1": 0.756682, + "nauc_map_at_100_max": 0.401584, + "nauc_map_at_100_std": -0.418073, + "nauc_map_at_100_diff1": 0.755901, + "nauc_map_at_1000_max": 0.401678, + "nauc_map_at_1000_std": -0.417576, + "nauc_map_at_1000_diff1": 0.755815, + "nauc_recall_at_1_max": 0.308198, + "nauc_recall_at_1_std": -0.387955, + "nauc_recall_at_1_diff1": 0.788882, + "nauc_recall_at_3_max": 0.354496, + "nauc_recall_at_3_std": -0.533206, + "nauc_recall_at_3_diff1": 0.727091, + "nauc_recall_at_5_max": 0.36771, + "nauc_recall_at_5_std": -0.589987, + "nauc_recall_at_5_diff1": 0.719, + "nauc_recall_at_10_max": 0.377964, + "nauc_recall_at_10_std": -0.611771, + "nauc_recall_at_10_diff1": 0.708103, + "nauc_recall_at_20_max": 0.421849, + "nauc_recall_at_20_std": -0.577243, + "nauc_recall_at_20_diff1": 0.703409, + "nauc_recall_at_100_max": 0.460402, + "nauc_recall_at_100_std": -0.526955, + "nauc_recall_at_100_diff1": 0.711036, + "nauc_recall_at_1000_max": 0.471789, + "nauc_recall_at_1000_std": 0.66729, + "nauc_recall_at_1000_diff1": 0.181106, + "nauc_precision_at_1_max": 0.412548, + "nauc_precision_at_1_std": -0.357265, + "nauc_precision_at_1_diff1": 0.765052, + "nauc_precision_at_3_max": 0.085934, + "nauc_precision_at_3_std": 0.066223, + "nauc_precision_at_3_diff1": -0.178924, + "nauc_precision_at_5_max": 0.018243, + "nauc_precision_at_5_std": 0.168216, + "nauc_precision_at_5_diff1": -0.306048, + "nauc_precision_at_10_max": -0.033062, + "nauc_precision_at_10_std": 0.268177, + "nauc_precision_at_10_diff1": -0.389928, + "nauc_precision_at_20_max": -0.054235, + "nauc_precision_at_20_std": 0.327258, + "nauc_precision_at_20_diff1": -0.41662, + "nauc_precision_at_100_max": -0.079566, + "nauc_precision_at_100_std": 0.383197, + "nauc_precision_at_100_diff1": -0.433671, + "nauc_precision_at_1000_max": -0.085474, + "nauc_precision_at_1000_std": 0.391768, + "nauc_precision_at_1000_diff1": -0.437051, + "nauc_mrr_at_1_max": 0.409967, + "nauc_mrr_at_1_std": -0.356587, + "nauc_mrr_at_1_diff1": 0.765241, + "nauc_mrr_at_3_max": 0.421829, + "nauc_mrr_at_3_std": -0.380018, + "nauc_mrr_at_3_diff1": 0.753848, + "nauc_mrr_at_5_max": 0.421783, + "nauc_mrr_at_5_std": -0.380764, + "nauc_mrr_at_5_diff1": 0.75556, + "nauc_mrr_at_10_max": 0.420886, + "nauc_mrr_at_10_std": -0.37645, + "nauc_mrr_at_10_diff1": 0.755875, + "nauc_mrr_at_20_max": 0.420632, + "nauc_mrr_at_20_std": -0.375944, + "nauc_mrr_at_20_diff1": 0.756076, + "nauc_mrr_at_100_max": 0.420385, + "nauc_mrr_at_100_std": -0.3759, + "nauc_mrr_at_100_diff1": 0.756118, + "nauc_mrr_at_1000_max": 0.420378, + "nauc_mrr_at_1000_std": -0.375884, + "nauc_mrr_at_1000_diff1": 0.75612, + "main_score": 0.88565, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 115.79108762741089, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/RedditClustering.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/RedditClustering.json new file mode 100644 index 0000000000..4e419802bd --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "task_name": "RedditClustering", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.580886, + "v_measure_std": 0.043772, + "v_measures": [ + 0.587523, + 0.646064, + 0.517673, + 0.586823, + 0.570099, + 0.558642, + 0.596205, + 0.536522, + 0.552073, + 0.559743, + 0.54168, + 0.61089, + 0.566427, + 0.602002, + 0.682698, + 0.52719, + 0.602122, + 0.672474, + 0.572191, + 0.5439, + 0.532486, + 0.556079, + 0.645612, + 0.606588, + 0.548441 + ], + "main_score": 0.580886, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 29.885157585144043, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/RedditClusteringP2P.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/RedditClusteringP2P.json new file mode 100644 index 0000000000..ea8adf0eb1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "task_name": "RedditClusteringP2P", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.656259, + "v_measure_std": 0.12463, + "v_measures": [ + 0.706985, + 0.713345, + 0.679923, + 0.417677, + 0.729404, + 0.664411, + 0.410366, + 0.764031, + 0.714972, + 0.761476 + ], + "main_score": 0.656259, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 60.45033025741577, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SCIDOCS.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SCIDOCS.json new file mode 100644 index 0000000000..4eebf2f7c4 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SCIDOCS.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88", + "task_name": "SCIDOCS", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.25, + "ndcg_at_3": 0.19659, + "ndcg_at_5": 0.1702, + "ndcg_at_10": 0.2044, + "ndcg_at_20": 0.23289, + "ndcg_at_100": 0.28684, + "ndcg_at_1000": 0.34285, + "map_at_1": 0.05083, + "map_at_3": 0.08868, + "map_at_5": 0.10546, + "map_at_10": 0.12218, + "map_at_20": 0.13276, + "map_at_100": 0.14331, + "map_at_1000": 0.14652, + "recall_at_1": 0.05083, + "recall_at_3": 0.10988, + "recall_at_5": 0.14868, + "recall_at_10": 0.21122, + "recall_at_20": 0.27787, + "recall_at_100": 0.45363, + "recall_at_1000": 0.7271, + "precision_at_1": 0.25, + "precision_at_3": 0.18067, + "precision_at_5": 0.1466, + "precision_at_10": 0.1043, + "precision_at_20": 0.06865, + "precision_at_100": 0.02232, + "precision_at_1000": 0.00358, + "mrr_at_1": 0.25, + "mrr_at_3": 0.321333, + "mrr_at_5": 0.339333, + "mrr_at_10": 0.355128, + "mrr_at_20": 0.361643, + "mrr_at_100": 0.366245, + "mrr_at_1000": 0.366794, + "nauc_ndcg_at_1_max": 0.258469, + "nauc_ndcg_at_1_std": 0.160481, + "nauc_ndcg_at_1_diff1": 0.217629, + "nauc_ndcg_at_3_max": 0.301403, + "nauc_ndcg_at_3_std": 0.190537, + "nauc_ndcg_at_3_diff1": 0.190835, + "nauc_ndcg_at_5_max": 0.311084, + "nauc_ndcg_at_5_std": 0.222895, + "nauc_ndcg_at_5_diff1": 0.173354, + "nauc_ndcg_at_10_max": 0.324311, + "nauc_ndcg_at_10_std": 0.262757, + "nauc_ndcg_at_10_diff1": 0.165408, + "nauc_ndcg_at_20_max": 0.334255, + "nauc_ndcg_at_20_std": 0.293054, + "nauc_ndcg_at_20_diff1": 0.163157, + "nauc_ndcg_at_100_max": 0.339497, + "nauc_ndcg_at_100_std": 0.35352, + "nauc_ndcg_at_100_diff1": 0.152621, + "nauc_ndcg_at_1000_max": 0.335897, + "nauc_ndcg_at_1000_std": 0.359828, + "nauc_ndcg_at_1000_diff1": 0.139005, + "nauc_map_at_1_max": 0.247816, + "nauc_map_at_1_std": 0.156148, + "nauc_map_at_1_diff1": 0.209187, + "nauc_map_at_3_max": 0.29637, + "nauc_map_at_3_std": 0.185069, + "nauc_map_at_3_diff1": 0.187118, + "nauc_map_at_5_max": 0.311209, + "nauc_map_at_5_std": 0.220674, + "nauc_map_at_5_diff1": 0.176358, + "nauc_map_at_10_max": 0.321868, + "nauc_map_at_10_std": 0.253603, + "nauc_map_at_10_diff1": 0.168725, + "nauc_map_at_20_max": 0.326776, + "nauc_map_at_20_std": 0.274817, + "nauc_map_at_20_diff1": 0.164063, + "nauc_map_at_100_max": 0.331624, + "nauc_map_at_100_std": 0.296231, + "nauc_map_at_100_diff1": 0.163123, + "nauc_map_at_1000_max": 0.331208, + "nauc_map_at_1000_std": 0.29861, + "nauc_map_at_1000_diff1": 0.16126, + "nauc_recall_at_1_max": 0.247816, + "nauc_recall_at_1_std": 0.156148, + "nauc_recall_at_1_diff1": 0.209187, + "nauc_recall_at_3_max": 0.310894, + "nauc_recall_at_3_std": 0.203372, + "nauc_recall_at_3_diff1": 0.171541, + "nauc_recall_at_5_max": 0.321874, + "nauc_recall_at_5_std": 0.254178, + "nauc_recall_at_5_diff1": 0.143268, + "nauc_recall_at_10_max": 0.327358, + "nauc_recall_at_10_std": 0.310942, + "nauc_recall_at_10_diff1": 0.1242, + "nauc_recall_at_20_max": 0.327534, + "nauc_recall_at_20_std": 0.351749, + "nauc_recall_at_20_diff1": 0.114072, + "nauc_recall_at_100_max": 0.28886, + "nauc_recall_at_100_std": 0.463744, + "nauc_recall_at_100_diff1": 0.065643, + "nauc_recall_at_1000_max": 0.235932, + "nauc_recall_at_1000_std": 0.487846, + "nauc_recall_at_1000_diff1": -0.029902, + "nauc_precision_at_1_max": 0.258469, + "nauc_precision_at_1_std": 0.160481, + "nauc_precision_at_1_diff1": 0.217629, + "nauc_precision_at_3_max": 0.319309, + "nauc_precision_at_3_std": 0.207627, + "nauc_precision_at_3_diff1": 0.177582, + "nauc_precision_at_5_max": 0.33114, + "nauc_precision_at_5_std": 0.258634, + "nauc_precision_at_5_diff1": 0.149615, + "nauc_precision_at_10_max": 0.334085, + "nauc_precision_at_10_std": 0.312686, + "nauc_precision_at_10_diff1": 0.128216, + "nauc_precision_at_20_max": 0.336113, + "nauc_precision_at_20_std": 0.354192, + "nauc_precision_at_20_diff1": 0.119683, + "nauc_precision_at_100_max": 0.299536, + "nauc_precision_at_100_std": 0.460862, + "nauc_precision_at_100_diff1": 0.071731, + "nauc_precision_at_1000_max": 0.24812, + "nauc_precision_at_1000_std": 0.472605, + "nauc_precision_at_1000_diff1": -0.019441, + "nauc_mrr_at_1_max": 0.258469, + "nauc_mrr_at_1_std": 0.160481, + "nauc_mrr_at_1_diff1": 0.217629, + "nauc_mrr_at_3_max": 0.27549, + "nauc_mrr_at_3_std": 0.173159, + "nauc_mrr_at_3_diff1": 0.201089, + "nauc_mrr_at_5_max": 0.278999, + "nauc_mrr_at_5_std": 0.18035, + "nauc_mrr_at_5_diff1": 0.1956, + "nauc_mrr_at_10_max": 0.283789, + "nauc_mrr_at_10_std": 0.189875, + "nauc_mrr_at_10_diff1": 0.196336, + "nauc_mrr_at_20_max": 0.286191, + "nauc_mrr_at_20_std": 0.191623, + "nauc_mrr_at_20_diff1": 0.198351, + "nauc_mrr_at_100_max": 0.284642, + "nauc_mrr_at_100_std": 0.191649, + "nauc_mrr_at_100_diff1": 0.197462, + "nauc_mrr_at_1000_max": 0.284539, + "nauc_mrr_at_1000_std": 0.191263, + "nauc_mrr_at_1000_diff1": 0.197599, + "main_score": 0.2044, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 4.624554634094238, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SICK-R.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SICK-R.json new file mode 100644 index 0000000000..d253ea8db7 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SICK-R.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "20a6d6f312dd54037fe07a32d58e5e168867909d", + "task_name": "SICK-R", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.837996, + "spearman": 0.757607, + "cosine_pearson": 0.837996, + "cosine_spearman": 0.757607, + "manhattan_pearson": 0.802659, + "manhattan_spearman": 0.7558, + "euclidean_pearson": 0.803501, + "euclidean_spearman": 0.756231, + "main_score": 0.757607, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 1.203150987625122, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS12.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS12.json new file mode 100644 index 0000000000..5e0b78501a --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS12.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", + "task_name": "STS12", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.80212, + "spearman": 0.748213, + "cosine_pearson": 0.80212, + "cosine_spearman": 0.748213, + "manhattan_pearson": 0.79011, + "manhattan_spearman": 0.745255, + "euclidean_pearson": 0.789511, + "euclidean_spearman": 0.744325, + "main_score": 0.748213, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.3792414665222168, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS13.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS13.json new file mode 100644 index 0000000000..4f40fe304a --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS13.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "7e90230a92c190f1bf69ae9002b8cea547a64cca", + "task_name": "STS13", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.8525, + "spearman": 0.866355, + "cosine_pearson": 0.8525, + "cosine_spearman": 0.866355, + "manhattan_pearson": 0.861504, + "manhattan_spearman": 0.863145, + "euclidean_pearson": 0.861214, + "euclidean_spearman": 0.862842, + "main_score": 0.866355, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.42250752449035645, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS14.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS14.json new file mode 100644 index 0000000000..8472788e9f --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS14.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "6031580fec1f6af667f0bd2da0a551cf4f0b2375", + "task_name": "STS14", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.814428, + "spearman": 0.787583, + "cosine_pearson": 0.814428, + "cosine_spearman": 0.787583, + "manhattan_pearson": 0.817136, + "manhattan_spearman": 0.786974, + "euclidean_pearson": 0.815923, + "euclidean_spearman": 0.785838, + "main_score": 0.787583, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.4137415885925293, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS15.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS15.json new file mode 100644 index 0000000000..51739f6a5e --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS15.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "ae752c7c21bf194d8b67fd573edf7ae58183cbe3", + "task_name": "STS15", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.823994, + "spearman": 0.853865, + "cosine_pearson": 0.823994, + "cosine_spearman": 0.853865, + "manhattan_pearson": 0.852366, + "manhattan_spearman": 0.856552, + "euclidean_pearson": 0.852288, + "euclidean_spearman": 0.856312, + "main_score": 0.853865, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.3460733890533447, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS16.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS16.json new file mode 100644 index 0000000000..ed8d758a89 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS16.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "4d8694f8f0e0100860b497b999b3dbed754a0513", + "task_name": "STS16", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.791962, + "spearman": 0.830956, + "cosine_pearson": 0.791962, + "cosine_spearman": 0.830956, + "manhattan_pearson": 0.82433, + "manhattan_spearman": 0.828628, + "euclidean_pearson": 0.825096, + "euclidean_spearman": 0.829352, + "main_score": 0.830956, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.2067854404449463, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS17.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS17.json new file mode 100644 index 0000000000..658814948c --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS17.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "faeb762787bd10488a50c8b5be4a3b82e411949c", + "task_name": "STS17", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.878808, + "spearman": 0.883035, + "cosine_pearson": 0.878808, + "cosine_spearman": 0.883035, + "manhattan_pearson": 0.876073, + "manhattan_spearman": 0.878386, + "euclidean_pearson": 0.876909, + "euclidean_spearman": 0.880923, + "main_score": 0.883035, + "hf_subset": "en-en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 22.920215845108032, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS22.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS22.json new file mode 100644 index 0000000000..fe333ae22a --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STS22.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3", + "task_name": "STS22", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.726476, + "spearman": 0.728422, + "cosine_pearson": 0.726476, + "cosine_spearman": 0.728422, + "manhattan_pearson": 0.736508, + "manhattan_spearman": 0.725433, + "euclidean_pearson": 0.736675, + "euclidean_spearman": 0.726016, + "main_score": 0.728422, + "hf_subset": "en", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.6105175018310547, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STSBenchmark.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STSBenchmark.json new file mode 100644 index 0000000000..154d023a70 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/STSBenchmark.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "b0fddb56ed78048fa8b90373c8a3cfc37b684831", + "task_name": "STSBenchmark", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.848412, + "spearman": 0.854068, + "cosine_pearson": 0.848412, + "cosine_spearman": 0.854068, + "manhattan_pearson": 0.856412, + "manhattan_spearman": 0.856715, + "euclidean_pearson": 0.856517, + "euclidean_spearman": 0.856771, + "main_score": 0.854068, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.19235491752624512, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SciDocsRR.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SciDocsRR.json new file mode 100644 index 0000000000..356fcdf0f6 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SciDocsRR.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "d3c5e1fc0b855ab6097bf1cda04dd73947d7caab", + "task_name": "SciDocsRR", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "map": 0.868347, + "mrr": 0.964288, + "nAUC_map_max": 0.537394, + "nAUC_map_std": 0.679598, + "nAUC_map_diff1": 0.008401, + "nAUC_mrr_max": 0.890159, + "nAUC_mrr_std": 0.818187, + "nAUC_mrr_diff1": 0.440473, + "main_score": 0.868347, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 5.28624701499939, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SciFact.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SciFact.json new file mode 100644 index 0000000000..5d9e194e28 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SciFact.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "0228b52cf27578f30900b9e5271d331663a030d7", + "task_name": "SciFact", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.65, + "ndcg_at_3": 0.71747, + "ndcg_at_5": 0.74288, + "ndcg_at_10": 0.7641, + "ndcg_at_20": 0.77575, + "ndcg_at_100": 0.78382, + "ndcg_at_1000": 0.78734, + "map_at_1": 0.61661, + "map_at_3": 0.6913, + "map_at_5": 0.7078, + "map_at_10": 0.7191, + "map_at_20": 0.7231, + "map_at_100": 0.72434, + "map_at_1000": 0.72449, + "recall_at_1": 0.61661, + "recall_at_3": 0.76322, + "recall_at_5": 0.82883, + "recall_at_10": 0.88922, + "recall_at_20": 0.93167, + "recall_at_100": 0.97333, + "recall_at_1000": 1.0, + "precision_at_1": 0.65, + "precision_at_3": 0.27889, + "precision_at_5": 0.18467, + "precision_at_10": 0.10067, + "precision_at_20": 0.053, + "precision_at_100": 0.01103, + "precision_at_1000": 0.00113, + "mrr_at_1": 0.65, + "mrr_at_3": 0.71, + "mrr_at_5": 0.724667, + "mrr_at_10": 0.730962, + "mrr_at_20": 0.733792, + "mrr_at_100": 0.734988, + "mrr_at_1000": 0.735137, + "nauc_ndcg_at_1_max": 0.579054, + "nauc_ndcg_at_1_std": -0.047609, + "nauc_ndcg_at_1_diff1": 0.74101, + "nauc_ndcg_at_3_max": 0.6059, + "nauc_ndcg_at_3_std": -0.079567, + "nauc_ndcg_at_3_diff1": 0.722102, + "nauc_ndcg_at_5_max": 0.61845, + "nauc_ndcg_at_5_std": -0.057745, + "nauc_ndcg_at_5_diff1": 0.713716, + "nauc_ndcg_at_10_max": 0.629298, + "nauc_ndcg_at_10_std": -0.029165, + "nauc_ndcg_at_10_diff1": 0.709786, + "nauc_ndcg_at_20_max": 0.629482, + "nauc_ndcg_at_20_std": 0.004764, + "nauc_ndcg_at_20_diff1": 0.706443, + "nauc_ndcg_at_100_max": 0.624548, + "nauc_ndcg_at_100_std": -0.011143, + "nauc_ndcg_at_100_diff1": 0.715598, + "nauc_ndcg_at_1000_max": 0.618894, + "nauc_ndcg_at_1000_std": -0.026415, + "nauc_ndcg_at_1000_diff1": 0.717109, + "nauc_map_at_1_max": 0.503702, + "nauc_map_at_1_std": -0.160483, + "nauc_map_at_1_diff1": 0.75645, + "nauc_map_at_3_max": 0.573965, + "nauc_map_at_3_std": -0.117385, + "nauc_map_at_3_diff1": 0.734594, + "nauc_map_at_5_max": 0.585882, + "nauc_map_at_5_std": -0.093833, + "nauc_map_at_5_diff1": 0.727075, + "nauc_map_at_10_max": 0.596179, + "nauc_map_at_10_std": -0.073981, + "nauc_map_at_10_diff1": 0.724943, + "nauc_map_at_20_max": 0.597303, + "nauc_map_at_20_std": -0.062932, + "nauc_map_at_20_diff1": 0.724153, + "nauc_map_at_100_max": 0.596522, + "nauc_map_at_100_std": -0.065082, + "nauc_map_at_100_diff1": 0.725345, + "nauc_map_at_1000_max": 0.596327, + "nauc_map_at_1000_std": -0.065603, + "nauc_map_at_1000_diff1": 0.725419, + "nauc_recall_at_1_max": 0.503702, + "nauc_recall_at_1_std": -0.160483, + "nauc_recall_at_1_diff1": 0.75645, + "nauc_recall_at_3_max": 0.613482, + "nauc_recall_at_3_std": -0.115438, + "nauc_recall_at_3_diff1": 0.701962, + "nauc_recall_at_5_max": 0.673441, + "nauc_recall_at_5_std": -0.012342, + "nauc_recall_at_5_diff1": 0.655745, + "nauc_recall_at_10_max": 0.745821, + "nauc_recall_at_10_std": 0.122023, + "nauc_recall_at_10_diff1": 0.62519, + "nauc_recall_at_20_max": 0.809865, + "nauc_recall_at_20_std": 0.535993, + "nauc_recall_at_20_diff1": 0.55157, + "nauc_recall_at_100_max": 0.91976, + "nauc_recall_at_100_std": 0.781746, + "nauc_recall_at_100_diff1": 0.645775, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": 0.579054, + "nauc_precision_at_1_std": -0.047609, + "nauc_precision_at_1_diff1": 0.74101, + "nauc_precision_at_3_max": 0.567751, + "nauc_precision_at_3_std": 0.175911, + "nauc_precision_at_3_diff1": 0.379541, + "nauc_precision_at_5_max": 0.527373, + "nauc_precision_at_5_std": 0.343407, + "nauc_precision_at_5_diff1": 0.188048, + "nauc_precision_at_10_max": 0.421965, + "nauc_precision_at_10_std": 0.45853, + "nauc_precision_at_10_diff1": -0.002126, + "nauc_precision_at_20_max": 0.346183, + "nauc_precision_at_20_std": 0.597145, + "nauc_precision_at_20_diff1": -0.131309, + "nauc_precision_at_100_max": 0.265415, + "nauc_precision_at_100_std": 0.609777, + "nauc_precision_at_100_diff1": -0.236613, + "nauc_precision_at_1000_max": 0.188273, + "nauc_precision_at_1000_std": 0.589503, + "nauc_precision_at_1000_diff1": -0.34064, + "nauc_mrr_at_1_max": 0.579054, + "nauc_mrr_at_1_std": -0.047609, + "nauc_mrr_at_1_diff1": 0.74101, + "nauc_mrr_at_3_max": 0.617854, + "nauc_mrr_at_3_std": -0.039369, + "nauc_mrr_at_3_diff1": 0.721785, + "nauc_mrr_at_5_max": 0.628314, + "nauc_mrr_at_5_std": -0.021893, + "nauc_mrr_at_5_diff1": 0.716951, + "nauc_mrr_at_10_max": 0.624487, + "nauc_mrr_at_10_std": -0.020109, + "nauc_mrr_at_10_diff1": 0.716211, + "nauc_mrr_at_20_max": 0.623031, + "nauc_mrr_at_20_std": -0.014551, + "nauc_mrr_at_20_diff1": 0.716028, + "nauc_mrr_at_100_max": 0.622453, + "nauc_mrr_at_100_std": -0.016318, + "nauc_mrr_at_100_diff1": 0.717306, + "nauc_mrr_at_1000_max": 0.62227, + "nauc_mrr_at_1000_std": -0.016821, + "nauc_mrr_at_1000_diff1": 0.717376, + "main_score": 0.7641, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 1.6036255359649658, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SprintDuplicateQuestions.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SprintDuplicateQuestions.json new file mode 100644 index 0000000000..a08af3c0e4 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SprintDuplicateQuestions.json @@ -0,0 +1,58 @@ +{ + "dataset_revision": "d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46", + "task_name": "SprintDuplicateQuestions", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "similarity_accuracy": 0.998921, + "similarity_accuracy_threshold": 0.867819, + "similarity_f1": 0.946066, + "similarity_f1_threshold": 0.864817, + "similarity_precision": 0.936337, + "similarity_recall": 0.956, + "similarity_ap": 0.974051, + "cosine_accuracy": 0.998921, + "cosine_accuracy_threshold": 0.867819, + "cosine_f1": 0.946066, + "cosine_f1_threshold": 0.864817, + "cosine_precision": 0.936337, + "cosine_recall": 0.956, + "cosine_ap": 0.974051, + "manhattan_accuracy": 0.998901, + "manhattan_accuracy_threshold": 435.277649, + "manhattan_f1": 0.945239, + "manhattan_f1_threshold": 439.026031, + "manhattan_precision": 0.932814, + "manhattan_recall": 0.958, + "manhattan_ap": 0.974028, + "euclidean_accuracy": 0.998921, + "euclidean_accuracy_threshold": 19.425079, + "euclidean_f1": 0.945959, + "euclidean_f1_threshold": 19.683056, + "euclidean_precision": 0.938053, + "euclidean_recall": 0.954, + "euclidean_ap": 0.974055, + "dot_accuracy": 0.998762, + "dot_accuracy_threshold": 1251.746338, + "dot_f1": 0.937343, + "dot_f1_threshold": 1251.401367, + "dot_precision": 0.939698, + "dot_recall": 0.935, + "dot_ap": 0.970464, + "max_accuracy": 0.998921, + "max_f1": 0.946066, + "max_precision": 0.939698, + "max_recall": 0.958, + "max_ap": 0.974055, + "main_score": 0.974055, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 3.85636043548584, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackExchangeClustering.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackExchangeClustering.json new file mode 100644 index 0000000000..166675364e --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "task_name": "StackExchangeClustering", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.694833, + "v_measure_std": 0.040067, + "v_measures": [ + 0.747661, + 0.725212, + 0.622707, + 0.709454, + 0.705271, + 0.660527, + 0.6634, + 0.757293, + 0.686119, + 0.693125, + 0.783741, + 0.752432, + 0.752398, + 0.713827, + 0.636137, + 0.693086, + 0.670949, + 0.660356, + 0.672339, + 0.677046, + 0.698895, + 0.656881, + 0.669655, + 0.707226, + 0.655086 + ], + "main_score": 0.694833, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 26.905051708221436, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackExchangeClusteringP2P.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..a327613961 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "task_name": "StackExchangeClusteringP2P", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.357219, + "v_measure_std": 0.016781, + "v_measures": [ + 0.346163, + 0.34734, + 0.341462, + 0.333523, + 0.336519, + 0.378701, + 0.374152, + 0.372608, + 0.37029, + 0.371434 + ], + "main_score": 0.357219, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 24.401734113693237, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackOverflowDupQuestions.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackOverflowDupQuestions.json new file mode 100644 index 0000000000..c5b6f7b852 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackOverflowDupQuestions.json @@ -0,0 +1,26 @@ +{ + "dataset_revision": "e185fbe320c72810689fc5848eb6114e1ef5ec69", + "task_name": "StackOverflowDupQuestions", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "map": 0.548875, + "mrr": 0.559648, + "nAUC_map_max": 0.123841, + "nAUC_map_std": 0.100551, + "nAUC_map_diff1": 0.396629, + "nAUC_mrr_max": 0.136113, + "nAUC_mrr_std": 0.102842, + "nAUC_mrr_diff1": 0.394931, + "main_score": 0.548875, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 4.278441429138184, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackOverflowQA.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackOverflowQA.json new file mode 100644 index 0000000000..90faa10c52 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/StackOverflowQA.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "db8f169f3894c14a00251061f957b2063eef2bd5", + "task_name": "StackOverflowQA", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.85507, + "ndcg_at_3": 0.89517, + "ndcg_at_5": 0.903, + "ndcg_at_10": 0.90876, + "ndcg_at_20": 0.91167, + "ndcg_at_100": 0.91491, + "ndcg_at_1000": 0.91604, + "map_at_1": 0.85507, + "map_at_3": 0.88574, + "map_at_5": 0.89008, + "map_at_10": 0.8925, + "map_at_20": 0.89323, + "map_at_100": 0.89367, + "map_at_1000": 0.89372, + "recall_at_1": 0.85507, + "recall_at_3": 0.92227, + "recall_at_5": 0.94132, + "recall_at_10": 0.95888, + "recall_at_20": 0.97091, + "recall_at_100": 0.98847, + "recall_at_1000": 0.99749, + "precision_at_1": 0.85507, + "precision_at_3": 0.30742, + "precision_at_5": 0.18826, + "precision_at_10": 0.09589, + "precision_at_20": 0.04855, + "precision_at_100": 0.00988, + "precision_at_1000": 0.001, + "mrr_at_1": 0.855065, + "mrr_at_3": 0.885741, + "mrr_at_5": 0.890079, + "mrr_at_10": 0.892505, + "mrr_at_20": 0.893231, + "mrr_at_100": 0.893675, + "mrr_at_1000": 0.893715, + "nauc_ndcg_at_1_max": 0.859336, + "nauc_ndcg_at_1_std": 0.012345, + "nauc_ndcg_at_1_diff1": 0.920371, + "nauc_ndcg_at_3_max": 0.882135, + "nauc_ndcg_at_3_std": 0.065231, + "nauc_ndcg_at_3_diff1": 0.903041, + "nauc_ndcg_at_5_max": 0.881322, + "nauc_ndcg_at_5_std": 0.075221, + "nauc_ndcg_at_5_diff1": 0.904596, + "nauc_ndcg_at_10_max": 0.878573, + "nauc_ndcg_at_10_std": 0.079055, + "nauc_ndcg_at_10_diff1": 0.904556, + "nauc_ndcg_at_20_max": 0.877309, + "nauc_ndcg_at_20_std": 0.069308, + "nauc_ndcg_at_20_diff1": 0.905878, + "nauc_ndcg_at_100_max": 0.876707, + "nauc_ndcg_at_100_std": 0.070313, + "nauc_ndcg_at_100_diff1": 0.906815, + "nauc_ndcg_at_1000_max": 0.875858, + "nauc_ndcg_at_1000_std": 0.064697, + "nauc_ndcg_at_1000_diff1": 0.907402, + "nauc_map_at_1_max": 0.859336, + "nauc_map_at_1_std": 0.012345, + "nauc_map_at_1_diff1": 0.920371, + "nauc_map_at_3_max": 0.875156, + "nauc_map_at_3_std": 0.049876, + "nauc_map_at_3_diff1": 0.907415, + "nauc_map_at_5_max": 0.874388, + "nauc_map_at_5_std": 0.053981, + "nauc_map_at_5_diff1": 0.908289, + "nauc_map_at_10_max": 0.87328, + "nauc_map_at_10_std": 0.055176, + "nauc_map_at_10_diff1": 0.908368, + "nauc_map_at_20_max": 0.872952, + "nauc_map_at_20_std": 0.052894, + "nauc_map_at_20_diff1": 0.908661, + "nauc_map_at_100_max": 0.87292, + "nauc_map_at_100_std": 0.053197, + "nauc_map_at_100_diff1": 0.908781, + "nauc_map_at_1000_max": 0.872898, + "nauc_map_at_1000_std": 0.053035, + "nauc_map_at_1000_diff1": 0.908794, + "nauc_recall_at_1_max": 0.859336, + "nauc_recall_at_1_std": 0.012345, + "nauc_recall_at_1_diff1": 0.920371, + "nauc_recall_at_3_max": 0.911041, + "nauc_recall_at_3_std": 0.128343, + "nauc_recall_at_3_diff1": 0.885467, + "nauc_recall_at_5_max": 0.917877, + "nauc_recall_at_5_std": 0.189442, + "nauc_recall_at_5_diff1": 0.886371, + "nauc_recall_at_10_max": 0.914816, + "nauc_recall_at_10_std": 0.259318, + "nauc_recall_at_10_diff1": 0.878232, + "nauc_recall_at_20_max": 0.915141, + "nauc_recall_at_20_std": 0.216995, + "nauc_recall_at_20_diff1": 0.883783, + "nauc_recall_at_100_max": 0.942466, + "nauc_recall_at_100_std": 0.44601, + "nauc_recall_at_100_diff1": 0.886852, + "nauc_recall_at_1000_max": 0.947724, + "nauc_recall_at_1000_std": 0.338708, + "nauc_recall_at_1000_diff1": 0.973862, + "nauc_precision_at_1_max": 0.859336, + "nauc_precision_at_1_std": 0.012345, + "nauc_precision_at_1_diff1": 0.920371, + "nauc_precision_at_3_max": 0.911041, + "nauc_precision_at_3_std": 0.128343, + "nauc_precision_at_3_diff1": 0.885467, + "nauc_precision_at_5_max": 0.917877, + "nauc_precision_at_5_std": 0.189442, + "nauc_precision_at_5_diff1": 0.886371, + "nauc_precision_at_10_max": 0.914816, + "nauc_precision_at_10_std": 0.259318, + "nauc_precision_at_10_diff1": 0.878232, + "nauc_precision_at_20_max": 0.915141, + "nauc_precision_at_20_std": 0.216995, + "nauc_precision_at_20_diff1": 0.883783, + "nauc_precision_at_100_max": 0.942466, + "nauc_precision_at_100_std": 0.44601, + "nauc_precision_at_100_diff1": 0.886852, + "nauc_precision_at_1000_max": 0.947724, + "nauc_precision_at_1000_std": 0.338708, + "nauc_precision_at_1000_diff1": 0.973862, + "nauc_mrr_at_1_max": 0.859336, + "nauc_mrr_at_1_std": 0.012345, + "nauc_mrr_at_1_diff1": 0.920371, + "nauc_mrr_at_3_max": 0.875156, + "nauc_mrr_at_3_std": 0.049876, + "nauc_mrr_at_3_diff1": 0.907415, + "nauc_mrr_at_5_max": 0.874388, + "nauc_mrr_at_5_std": 0.053981, + "nauc_mrr_at_5_diff1": 0.908289, + "nauc_mrr_at_10_max": 0.87328, + "nauc_mrr_at_10_std": 0.055176, + "nauc_mrr_at_10_diff1": 0.908368, + "nauc_mrr_at_20_max": 0.872952, + "nauc_mrr_at_20_std": 0.052894, + "nauc_mrr_at_20_diff1": 0.908661, + "nauc_mrr_at_100_max": 0.87292, + "nauc_mrr_at_100_std": 0.053197, + "nauc_mrr_at_100_diff1": 0.908781, + "nauc_mrr_at_1000_max": 0.872898, + "nauc_mrr_at_1000_std": 0.053035, + "nauc_mrr_at_1000_diff1": 0.908794, + "main_score": 0.90876, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 12.350925207138062, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SummEval.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SummEval.json new file mode 100644 index 0000000000..601104b1be --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SummEval.json @@ -0,0 +1,24 @@ +{ + "dataset_revision": "cda12ad7615edc362dbf25a00fdd61d3b1eaf93c", + "task_name": "SummEval", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "pearson": 0.317721, + "spearman": 0.306854, + "cosine_spearman": 0.306854, + "cosine_pearson": 0.317721, + "dot_spearman": 0.306162, + "dot_pearson": 0.31185, + "main_score": 0.306854, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.5638136863708496, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SyntheticText2SQL.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SyntheticText2SQL.json new file mode 100644 index 0000000000..7a2b56e8db --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/SyntheticText2SQL.json @@ -0,0 +1,159 @@ +{ + "dataset_revision": "686b87296c3a0191b5d9415a00526c62db9fce09", + "task_name": "SyntheticText2SQL", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.13485, + "ndcg_at_3": 0.62325, + "ndcg_at_5": 0.63827, + "ndcg_at_10": 0.64685, + "ndcg_at_20": 0.64946, + "ndcg_at_100": 0.65044, + "ndcg_at_1000": 0.65057, + "map_at_1": 0.13485, + "map_at_3": 0.51797, + "map_at_5": 0.52637, + "map_at_10": 0.53004, + "map_at_20": 0.53079, + "map_at_100": 0.53095, + "map_at_1000": 0.53096, + "recall_at_1": 0.13485, + "recall_at_3": 0.92189, + "recall_at_5": 0.95813, + "recall_at_10": 0.98393, + "recall_at_20": 0.99402, + "recall_at_100": 0.99897, + "recall_at_1000": 1.0, + "precision_at_1": 0.13485, + "precision_at_3": 0.3073, + "precision_at_5": 0.19163, + "precision_at_10": 0.09839, + "precision_at_20": 0.0497, + "precision_at_100": 0.00999, + "precision_at_1000": 0.001, + "mrr_at_1": 0.468638, + "mrr_at_3": 0.6935, + "mrr_at_5": 0.700157, + "mrr_at_10": 0.703393, + "mrr_at_20": 0.70408, + "mrr_at_100": 0.704235, + "mrr_at_1000": 0.704241, + "nauc_ndcg_at_1_max": 0.042443, + "nauc_ndcg_at_1_std": -0.0555, + "nauc_ndcg_at_1_diff1": 0.589577, + "nauc_ndcg_at_3_max": 0.163479, + "nauc_ndcg_at_3_std": -0.262736, + "nauc_ndcg_at_3_diff1": -0.146196, + "nauc_ndcg_at_5_max": 0.153194, + "nauc_ndcg_at_5_std": -0.22759, + "nauc_ndcg_at_5_diff1": -0.032841, + "nauc_ndcg_at_10_max": 0.134905, + "nauc_ndcg_at_10_std": -0.19972, + "nauc_ndcg_at_10_diff1": 0.0556, + "nauc_ndcg_at_20_max": 0.127214, + "nauc_ndcg_at_20_std": -0.18818, + "nauc_ndcg_at_20_diff1": 0.088924, + "nauc_ndcg_at_100_max": 0.122523, + "nauc_ndcg_at_100_std": -0.186318, + "nauc_ndcg_at_100_diff1": 0.099933, + "nauc_ndcg_at_1000_max": 0.121603, + "nauc_ndcg_at_1000_std": -0.186752, + "nauc_ndcg_at_1000_diff1": 0.101901, + "nauc_map_at_1_max": 0.042443, + "nauc_map_at_1_std": -0.0555, + "nauc_map_at_1_diff1": 0.589577, + "nauc_map_at_3_max": 0.129445, + "nauc_map_at_3_std": -0.208883, + "nauc_map_at_3_diff1": 0.036997, + "nauc_map_at_5_max": 0.122938, + "nauc_map_at_5_std": -0.190012, + "nauc_map_at_5_diff1": 0.099187, + "nauc_map_at_10_max": 0.115822, + "nauc_map_at_10_std": -0.179779, + "nauc_map_at_10_diff1": 0.132159, + "nauc_map_at_20_max": 0.113902, + "nauc_map_at_20_std": -0.177164, + "nauc_map_at_20_diff1": 0.139925, + "nauc_map_at_100_max": 0.113352, + "nauc_map_at_100_std": -0.176831, + "nauc_map_at_100_diff1": 0.141379, + "nauc_map_at_1000_max": 0.113324, + "nauc_map_at_1000_std": -0.176835, + "nauc_map_at_1000_diff1": 0.141441, + "nauc_recall_at_1_max": 0.042443, + "nauc_recall_at_1_std": -0.0555, + "nauc_recall_at_1_diff1": 0.589577, + "nauc_recall_at_3_max": 0.354161, + "nauc_recall_at_3_std": -0.56016, + "nauc_recall_at_3_diff1": -1.149533, + "nauc_recall_at_5_max": 0.445477, + "nauc_recall_at_5_std": -0.56858, + "nauc_recall_at_5_diff1": -1.226276, + "nauc_recall_at_10_max": 0.541082, + "nauc_recall_at_10_std": -0.528129, + "nauc_recall_at_10_diff1": -1.284346, + "nauc_recall_at_20_max": 0.704297, + "nauc_recall_at_20_std": -0.260319, + "nauc_recall_at_20_diff1": -1.191931, + "nauc_recall_at_100_max": 0.89302, + "nauc_recall_at_100_std": 0.251976, + "nauc_recall_at_100_diff1": -1.544166, + "nauc_recall_at_1000_max": NaN, + "nauc_recall_at_1000_std": NaN, + "nauc_recall_at_1000_diff1": NaN, + "nauc_precision_at_1_max": 0.042443, + "nauc_precision_at_1_std": -0.0555, + "nauc_precision_at_1_diff1": 0.589577, + "nauc_precision_at_3_max": 0.354161, + "nauc_precision_at_3_std": -0.56016, + "nauc_precision_at_3_diff1": -1.149533, + "nauc_precision_at_5_max": 0.445477, + "nauc_precision_at_5_std": -0.56858, + "nauc_precision_at_5_diff1": -1.226276, + "nauc_precision_at_10_max": 0.541082, + "nauc_precision_at_10_std": -0.528129, + "nauc_precision_at_10_diff1": -1.284346, + "nauc_precision_at_20_max": 0.704297, + "nauc_precision_at_20_std": -0.260319, + "nauc_precision_at_20_diff1": -1.191931, + "nauc_precision_at_100_max": 0.89302, + "nauc_precision_at_100_std": 0.251976, + "nauc_precision_at_100_diff1": -1.544166, + "nauc_precision_at_1000_max": NaN, + "nauc_precision_at_1000_std": NaN, + "nauc_precision_at_1000_diff1": NaN, + "nauc_mrr_at_1_max": 0.077779, + "nauc_mrr_at_1_std": -0.101552, + "nauc_mrr_at_1_diff1": -0.167641, + "nauc_mrr_at_3_max": 0.128362, + "nauc_mrr_at_3_std": -0.187259, + "nauc_mrr_at_3_diff1": -0.355808, + "nauc_mrr_at_5_max": 0.124176, + "nauc_mrr_at_5_std": -0.173615, + "nauc_mrr_at_5_diff1": -0.333292, + "nauc_mrr_at_10_max": 0.119171, + "nauc_mrr_at_10_std": -0.167701, + "nauc_mrr_at_10_diff1": -0.319757, + "nauc_mrr_at_20_max": 0.1181, + "nauc_mrr_at_20_std": -0.166041, + "nauc_mrr_at_20_diff1": -0.316422, + "nauc_mrr_at_100_max": 0.117753, + "nauc_mrr_at_100_std": -0.165776, + "nauc_mrr_at_100_diff1": -0.315804, + "nauc_mrr_at_1000_max": 0.117734, + "nauc_mrr_at_1000_std": -0.165779, + "nauc_mrr_at_1000_diff1": -0.315773, + "main_score": 0.64685, + "hf_subset": "default", + "languages": [ + "eng-Latn", + "sql-Code" + ] + } + ] + }, + "evaluation_time": 36.36196184158325, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TRECCOVID.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TRECCOVID.json new file mode 100644 index 0000000000..9147ee8fee --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TRECCOVID.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "bb9466bac8153a0349341eb1b22e06409e78ef4e", + "task_name": "TRECCOVID", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.81, + "ndcg_at_3": 0.76927, + "ndcg_at_5": 0.767, + "ndcg_at_10": 0.75748, + "ndcg_at_20": 0.72276, + "ndcg_at_100": 0.57684, + "ndcg_at_1000": 0.51709, + "map_at_1": 0.00225, + "map_at_3": 0.0061, + "map_at_5": 0.01008, + "map_at_10": 0.01927, + "map_at_20": 0.03485, + "map_at_100": 0.11345, + "map_at_1000": 0.26512, + "recall_at_1": 0.00225, + "recall_at_3": 0.00638, + "recall_at_5": 0.01082, + "recall_at_10": 0.02143, + "recall_at_20": 0.03956, + "recall_at_100": 0.1456, + "recall_at_1000": 0.48548, + "precision_at_1": 0.86, + "precision_at_3": 0.80667, + "precision_at_5": 0.808, + "precision_at_10": 0.806, + "precision_at_20": 0.756, + "precision_at_100": 0.5938, + "precision_at_1000": 0.2253, + "mrr_at_1": 0.86, + "mrr_at_3": 0.906667, + "mrr_at_5": 0.906667, + "mrr_at_10": 0.906667, + "mrr_at_20": 0.907917, + "mrr_at_100": 0.907917, + "mrr_at_1000": 0.907917, + "nauc_ndcg_at_1_max": 0.488015, + "nauc_ndcg_at_1_std": 0.724806, + "nauc_ndcg_at_1_diff1": -0.081549, + "nauc_ndcg_at_3_max": 0.470185, + "nauc_ndcg_at_3_std": 0.751854, + "nauc_ndcg_at_3_diff1": -0.076831, + "nauc_ndcg_at_5_max": 0.403541, + "nauc_ndcg_at_5_std": 0.71221, + "nauc_ndcg_at_5_diff1": -0.105672, + "nauc_ndcg_at_10_max": 0.403529, + "nauc_ndcg_at_10_std": 0.672496, + "nauc_ndcg_at_10_diff1": -0.064097, + "nauc_ndcg_at_20_max": 0.409367, + "nauc_ndcg_at_20_std": 0.69772, + "nauc_ndcg_at_20_diff1": -0.070035, + "nauc_ndcg_at_100_max": 0.341197, + "nauc_ndcg_at_100_std": 0.747609, + "nauc_ndcg_at_100_diff1": -0.06647, + "nauc_ndcg_at_1000_max": 0.330588, + "nauc_ndcg_at_1000_std": 0.671889, + "nauc_ndcg_at_1000_diff1": -0.118661, + "nauc_map_at_1_max": 0.05649, + "nauc_map_at_1_std": 0.083537, + "nauc_map_at_1_diff1": -0.114739, + "nauc_map_at_3_max": 0.11654, + "nauc_map_at_3_std": 0.152909, + "nauc_map_at_3_diff1": -0.142754, + "nauc_map_at_5_max": 0.117468, + "nauc_map_at_5_std": 0.136636, + "nauc_map_at_5_diff1": -0.143756, + "nauc_map_at_10_max": 0.123048, + "nauc_map_at_10_std": 0.138796, + "nauc_map_at_10_diff1": -0.123402, + "nauc_map_at_20_max": 0.130006, + "nauc_map_at_20_std": 0.169494, + "nauc_map_at_20_diff1": -0.10144, + "nauc_map_at_100_max": 0.225332, + "nauc_map_at_100_std": 0.456099, + "nauc_map_at_100_diff1": -0.115984, + "nauc_map_at_1000_max": 0.319558, + "nauc_map_at_1000_std": 0.711252, + "nauc_map_at_1000_diff1": -0.12873, + "nauc_recall_at_1_max": 0.05649, + "nauc_recall_at_1_std": 0.083537, + "nauc_recall_at_1_diff1": -0.114739, + "nauc_recall_at_3_max": 0.076696, + "nauc_recall_at_3_std": 0.100304, + "nauc_recall_at_3_diff1": -0.155885, + "nauc_recall_at_5_max": 0.05858, + "nauc_recall_at_5_std": 0.06173, + "nauc_recall_at_5_diff1": -0.167811, + "nauc_recall_at_10_max": 0.044827, + "nauc_recall_at_10_std": 0.029474, + "nauc_recall_at_10_diff1": -0.134675, + "nauc_recall_at_20_max": 0.059332, + "nauc_recall_at_20_std": 0.066166, + "nauc_recall_at_20_diff1": -0.110565, + "nauc_recall_at_100_max": 0.147164, + "nauc_recall_at_100_std": 0.316315, + "nauc_recall_at_100_diff1": -0.135833, + "nauc_recall_at_1000_max": 0.294104, + "nauc_recall_at_1000_std": 0.538216, + "nauc_recall_at_1000_diff1": -0.141504, + "nauc_precision_at_1_max": 0.511016, + "nauc_precision_at_1_std": 0.851393, + "nauc_precision_at_1_diff1": -0.196203, + "nauc_precision_at_3_max": 0.495232, + "nauc_precision_at_3_std": 0.797375, + "nauc_precision_at_3_diff1": -0.169023, + "nauc_precision_at_5_max": 0.426881, + "nauc_precision_at_5_std": 0.744613, + "nauc_precision_at_5_diff1": -0.239086, + "nauc_precision_at_10_max": 0.436019, + "nauc_precision_at_10_std": 0.68697, + "nauc_precision_at_10_diff1": -0.138032, + "nauc_precision_at_20_max": 0.426572, + "nauc_precision_at_20_std": 0.688055, + "nauc_precision_at_20_diff1": -0.110141, + "nauc_precision_at_100_max": 0.360552, + "nauc_precision_at_100_std": 0.747532, + "nauc_precision_at_100_diff1": -0.061988, + "nauc_precision_at_1000_max": 0.277684, + "nauc_precision_at_1000_std": 0.504475, + "nauc_precision_at_1000_diff1": 0.025119, + "nauc_mrr_at_1_max": 0.511016, + "nauc_mrr_at_1_std": 0.851393, + "nauc_mrr_at_1_diff1": -0.196203, + "nauc_mrr_at_3_max": 0.400817, + "nauc_mrr_at_3_std": 0.839183, + "nauc_mrr_at_3_diff1": -0.347056, + "nauc_mrr_at_5_max": 0.400817, + "nauc_mrr_at_5_std": 0.839183, + "nauc_mrr_at_5_diff1": -0.347056, + "nauc_mrr_at_10_max": 0.400817, + "nauc_mrr_at_10_std": 0.839183, + "nauc_mrr_at_10_diff1": -0.347056, + "nauc_mrr_at_20_max": 0.414289, + "nauc_mrr_at_20_std": 0.840817, + "nauc_mrr_at_20_diff1": -0.327596, + "nauc_mrr_at_100_max": 0.414289, + "nauc_mrr_at_100_std": 0.840817, + "nauc_mrr_at_100_diff1": -0.327596, + "nauc_mrr_at_1000_max": 0.414289, + "nauc_mrr_at_1000_std": 0.840817, + "nauc_mrr_at_1000_diff1": -0.327596, + "main_score": 0.75748, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 17.784512042999268, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/Touche2020.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/Touche2020.json new file mode 100644 index 0000000000..168ce9592e --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/Touche2020.json @@ -0,0 +1,158 @@ +{ + "dataset_revision": "a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f", + "task_name": "Touche2020", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "ndcg_at_1": 0.15306, + "ndcg_at_3": 0.18397, + "ndcg_at_5": 0.17651, + "ndcg_at_10": 0.1797, + "ndcg_at_20": 0.20635, + "ndcg_at_100": 0.31764, + "ndcg_at_1000": 0.43965, + "map_at_1": 0.01601, + "map_at_3": 0.03694, + "map_at_5": 0.05014, + "map_at_10": 0.07164, + "map_at_20": 0.09271, + "map_at_100": 0.12998, + "map_at_1000": 0.14563, + "recall_at_1": 0.01601, + "recall_at_3": 0.04658, + "recall_at_5": 0.06988, + "recall_at_10": 0.12898, + "recall_at_20": 0.20726, + "recall_at_100": 0.44178, + "recall_at_1000": 0.81365, + "precision_at_1": 0.16327, + "precision_at_3": 0.20408, + "precision_at_5": 0.18367, + "precision_at_10": 0.16531, + "precision_at_20": 0.14388, + "precision_at_100": 0.07, + "precision_at_1000": 0.01496, + "mrr_at_1": 0.163265, + "mrr_at_3": 0.272109, + "mrr_at_5": 0.285374, + "mrr_at_10": 0.310593, + "mrr_at_20": 0.322977, + "mrr_at_100": 0.326395, + "mrr_at_1000": 0.326571, + "nauc_ndcg_at_1_max": -0.12872, + "nauc_ndcg_at_1_std": -0.183268, + "nauc_ndcg_at_1_diff1": 0.498385, + "nauc_ndcg_at_3_max": -0.102567, + "nauc_ndcg_at_3_std": -0.071274, + "nauc_ndcg_at_3_diff1": 0.318888, + "nauc_ndcg_at_5_max": -0.026734, + "nauc_ndcg_at_5_std": -0.072733, + "nauc_ndcg_at_5_diff1": 0.347003, + "nauc_ndcg_at_10_max": -0.057487, + "nauc_ndcg_at_10_std": -0.097217, + "nauc_ndcg_at_10_diff1": 0.348241, + "nauc_ndcg_at_20_max": -0.092235, + "nauc_ndcg_at_20_std": -0.036235, + "nauc_ndcg_at_20_diff1": 0.292401, + "nauc_ndcg_at_100_max": -0.120384, + "nauc_ndcg_at_100_std": 0.18406, + "nauc_ndcg_at_100_diff1": 0.298194, + "nauc_ndcg_at_1000_max": -0.071041, + "nauc_ndcg_at_1000_std": 0.279065, + "nauc_ndcg_at_1000_diff1": 0.286675, + "nauc_map_at_1_max": -0.102081, + "nauc_map_at_1_std": -0.213119, + "nauc_map_at_1_diff1": 0.321143, + "nauc_map_at_3_max": -0.059372, + "nauc_map_at_3_std": -0.162474, + "nauc_map_at_3_diff1": 0.260735, + "nauc_map_at_5_max": 0.003938, + "nauc_map_at_5_std": -0.149815, + "nauc_map_at_5_diff1": 0.297964, + "nauc_map_at_10_max": 0.045665, + "nauc_map_at_10_std": -0.142763, + "nauc_map_at_10_diff1": 0.293567, + "nauc_map_at_20_max": 0.022559, + "nauc_map_at_20_std": -0.096985, + "nauc_map_at_20_diff1": 0.293745, + "nauc_map_at_100_max": -0.021718, + "nauc_map_at_100_std": 0.03895, + "nauc_map_at_100_diff1": 0.314493, + "nauc_map_at_1000_max": -0.00661, + "nauc_map_at_1000_std": 0.078654, + "nauc_map_at_1000_diff1": 0.308554, + "nauc_recall_at_1_max": -0.102081, + "nauc_recall_at_1_std": -0.213119, + "nauc_recall_at_1_diff1": 0.321143, + "nauc_recall_at_3_max": -0.102755, + "nauc_recall_at_3_std": -0.122091, + "nauc_recall_at_3_diff1": 0.187628, + "nauc_recall_at_5_max": -0.034163, + "nauc_recall_at_5_std": -0.118007, + "nauc_recall_at_5_diff1": 0.253532, + "nauc_recall_at_10_max": -0.063663, + "nauc_recall_at_10_std": -0.140681, + "nauc_recall_at_10_diff1": 0.24485, + "nauc_recall_at_20_max": -0.117078, + "nauc_recall_at_20_std": -0.013762, + "nauc_recall_at_20_diff1": 0.179775, + "nauc_recall_at_100_max": -0.174605, + "nauc_recall_at_100_std": 0.321628, + "nauc_recall_at_100_diff1": 0.197526, + "nauc_recall_at_1000_max": -0.16108, + "nauc_recall_at_1000_std": 0.695903, + "nauc_recall_at_1000_diff1": 0.004621, + "nauc_precision_at_1_max": -0.099496, + "nauc_precision_at_1_std": -0.189418, + "nauc_precision_at_1_diff1": 0.459954, + "nauc_precision_at_3_max": -0.124122, + "nauc_precision_at_3_std": -0.028101, + "nauc_precision_at_3_diff1": 0.234271, + "nauc_precision_at_5_max": -0.000634, + "nauc_precision_at_5_std": -0.030772, + "nauc_precision_at_5_diff1": 0.308537, + "nauc_precision_at_10_max": -0.01626, + "nauc_precision_at_10_std": -0.003277, + "nauc_precision_at_10_diff1": 0.375037, + "nauc_precision_at_20_max": -0.079985, + "nauc_precision_at_20_std": 0.223445, + "nauc_precision_at_20_diff1": 0.232273, + "nauc_precision_at_100_max": -0.090233, + "nauc_precision_at_100_std": 0.615851, + "nauc_precision_at_100_diff1": 0.171047, + "nauc_precision_at_1000_max": 0.115137, + "nauc_precision_at_1000_std": 0.426656, + "nauc_precision_at_1000_diff1": -0.188415, + "nauc_mrr_at_1_max": -0.099496, + "nauc_mrr_at_1_std": -0.189418, + "nauc_mrr_at_1_diff1": 0.459954, + "nauc_mrr_at_3_max": -0.133684, + "nauc_mrr_at_3_std": -0.086698, + "nauc_mrr_at_3_diff1": 0.328809, + "nauc_mrr_at_5_max": -0.14383, + "nauc_mrr_at_5_std": -0.072054, + "nauc_mrr_at_5_diff1": 0.318755, + "nauc_mrr_at_10_max": -0.158034, + "nauc_mrr_at_10_std": -0.104043, + "nauc_mrr_at_10_diff1": 0.355078, + "nauc_mrr_at_20_max": -0.153904, + "nauc_mrr_at_20_std": -0.074295, + "nauc_mrr_at_20_diff1": 0.339144, + "nauc_mrr_at_100_max": -0.155374, + "nauc_mrr_at_100_std": -0.084205, + "nauc_mrr_at_100_diff1": 0.341865, + "nauc_mrr_at_1000_max": -0.154376, + "nauc_mrr_at_1000_std": -0.084904, + "nauc_mrr_at_1000_diff1": 0.341441, + "main_score": 0.1797, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 45.33574080467224, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ToxicConversationsClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ToxicConversationsClassification.json new file mode 100644 index 0000000000..b924cc473b --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/ToxicConversationsClassification.json @@ -0,0 +1,95 @@ +{ + "dataset_revision": "edfaf9da55d3dd50d43143d90c1ac476895ae6de", + "task_name": "ToxicConversationsClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.815381, + "f1": 0.637267, + "f1_weighted": 0.850335, + "ap": 0.210231, + "ap_weighted": 0.210231, + "scores_per_experiment": [ + { + "accuracy": 0.848633, + "f1": 0.661906, + "f1_weighted": 0.873415, + "ap": 0.224169, + "ap_weighted": 0.224169 + }, + { + "accuracy": 0.829102, + "f1": 0.638009, + "f1_weighted": 0.859409, + "ap": 0.198826, + "ap_weighted": 0.198826 + }, + { + "accuracy": 0.87793, + "f1": 0.696187, + "f1_weighted": 0.893993, + "ap": 0.260871, + "ap_weighted": 0.260871 + }, + { + "accuracy": 0.861816, + "f1": 0.685729, + "f1_weighted": 0.883756, + "ap": 0.257763, + "ap_weighted": 0.257763 + }, + { + "accuracy": 0.713867, + "f1": 0.557276, + "f1_weighted": 0.778921, + "ap": 0.157071, + "ap_weighted": 0.157071 + }, + { + "accuracy": 0.723145, + "f1": 0.572781, + "f1_weighted": 0.786136, + "ap": 0.176889, + "ap_weighted": 0.176889 + }, + { + "accuracy": 0.864746, + "f1": 0.674917, + "f1_weighted": 0.884032, + "ap": 0.23282, + "ap_weighted": 0.23282 + }, + { + "accuracy": 0.795898, + "f1": 0.618763, + "f1_weighted": 0.837518, + "ap": 0.194422, + "ap_weighted": 0.194422 + }, + { + "accuracy": 0.797852, + "f1": 0.61371, + "f1_weighted": 0.838222, + "ap": 0.183635, + "ap_weighted": 0.183635 + }, + { + "accuracy": 0.84082, + "f1": 0.653398, + "f1_weighted": 0.86795, + "ap": 0.215841, + "ap_weighted": 0.215841 + } + ], + "main_score": 0.815381, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 22.64286518096924, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TweetSentimentExtractionClassification.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TweetSentimentExtractionClassification.json new file mode 100644 index 0000000000..a839311551 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TweetSentimentExtractionClassification.json @@ -0,0 +1,73 @@ +{ + "dataset_revision": "d604517c81ca91fe16a244d1248fc021f9ecee7a", + "task_name": "TweetSentimentExtractionClassification", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "accuracy": 0.633164, + "f1": 0.636527, + "f1_weighted": 0.627267, + "scores_per_experiment": [ + { + "accuracy": 0.621109, + "f1": 0.620266, + "f1_weighted": 0.606565 + }, + { + "accuracy": 0.655631, + "f1": 0.658718, + "f1_weighted": 0.650522 + }, + { + "accuracy": 0.647991, + "f1": 0.652406, + "f1_weighted": 0.645691 + }, + { + "accuracy": 0.640634, + "f1": 0.646167, + "f1_weighted": 0.63723 + }, + { + "accuracy": 0.656197, + "f1": 0.660158, + "f1_weighted": 0.653504 + }, + { + "accuracy": 0.641483, + "f1": 0.645663, + "f1_weighted": 0.636478 + }, + { + "accuracy": 0.609508, + "f1": 0.610081, + "f1_weighted": 0.602421 + }, + { + "accuracy": 0.65931, + "f1": 0.664029, + "f1_weighted": 0.654971 + }, + { + "accuracy": 0.577533, + "f1": 0.580842, + "f1_weighted": 0.569163 + }, + { + "accuracy": 0.622241, + "f1": 0.62694, + "f1_weighted": 0.616126 + } + ], + "main_score": 0.633164, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 7.740556240081787, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwentyNewsgroupsClustering.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..ed4674582b --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "task_name": "TwentyNewsgroupsClustering", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "v_measure": 0.506715, + "v_measure_std": 0.009459, + "v_measures": [ + 0.491367, + 0.502601, + 0.52067, + 0.512605, + 0.516926, + 0.499317, + 0.496158, + 0.512195, + 0.500218, + 0.515089 + ], + "main_score": 0.506715, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 5.780537128448486, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwitterSemEval2015.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwitterSemEval2015.json new file mode 100644 index 0000000000..71799b5739 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwitterSemEval2015.json @@ -0,0 +1,58 @@ +{ + "dataset_revision": "70970daeab8776df92f5ea462b6173c0b46fd2d1", + "task_name": "TwitterSemEval2015", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "similarity_accuracy": 0.870299, + "similarity_accuracy_threshold": 0.902604, + "similarity_f1": 0.710123, + "similarity_f1_threshold": 0.880445, + "similarity_precision": 0.688647, + "similarity_recall": 0.732982, + "similarity_ap": 0.770643, + "cosine_accuracy": 0.870299, + "cosine_accuracy_threshold": 0.902604, + "cosine_f1": 0.710123, + "cosine_f1_threshold": 0.880445, + "cosine_precision": 0.688647, + "cosine_recall": 0.732982, + "cosine_ap": 0.770643, + "manhattan_accuracy": 0.87012, + "manhattan_accuracy_threshold": 385.482727, + "manhattan_f1": 0.707689, + "manhattan_f1_threshold": 432.180908, + "manhattan_precision": 0.65746, + "manhattan_recall": 0.766227, + "manhattan_ap": 0.768252, + "euclidean_accuracy": 0.870001, + "euclidean_accuracy_threshold": 17.374836, + "euclidean_f1": 0.70796, + "euclidean_f1_threshold": 18.802986, + "euclidean_precision": 0.697008, + "euclidean_recall": 0.719261, + "euclidean_ap": 0.767965, + "dot_accuracy": 0.86249, + "dot_accuracy_threshold": 1356.315674, + "dot_f1": 0.686449, + "dot_f1_threshold": 1330.348145, + "dot_precision": 0.663466, + "dot_recall": 0.711082, + "dot_ap": 0.744625, + "max_accuracy": 0.870299, + "max_f1": 0.710123, + "max_precision": 0.697008, + "max_recall": 0.766227, + "max_ap": 0.770643, + "main_score": 0.770643, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 0.9958534240722656, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwitterURLCorpus.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwitterURLCorpus.json new file mode 100644 index 0000000000..7a4995a3f1 --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/TwitterURLCorpus.json @@ -0,0 +1,58 @@ +{ + "dataset_revision": "8b6510b0b1fa4e4c4f879467980e9be563ec1cdf", + "task_name": "TwitterURLCorpus", + "mteb_version": "1.29.7", + "scores": { + "test": [ + { + "similarity_accuracy": 0.8794, + "similarity_accuracy_threshold": 0.921966, + "similarity_f1": 0.762279, + "similarity_f1_threshold": 0.904098, + "similarity_precision": 0.716931, + "similarity_recall": 0.813751, + "similarity_ap": 0.831839, + "cosine_accuracy": 0.8794, + "cosine_accuracy_threshold": 0.921966, + "cosine_f1": 0.762279, + "cosine_f1_threshold": 0.904098, + "cosine_precision": 0.716931, + "cosine_recall": 0.813751, + "cosine_ap": 0.831839, + "manhattan_accuracy": 0.880176, + "manhattan_accuracy_threshold": 343.594116, + "manhattan_f1": 0.763184, + "manhattan_f1_threshold": 364.531494, + "manhattan_precision": 0.734768, + "manhattan_recall": 0.793887, + "manhattan_ap": 0.833393, + "euclidean_accuracy": 0.879478, + "euclidean_accuracy_threshold": 15.324363, + "euclidean_f1": 0.763108, + "euclidean_f1_threshold": 16.658806, + "euclidean_precision": 0.729366, + "euclidean_recall": 0.800123, + "euclidean_ap": 0.832183, + "dot_accuracy": 0.863119, + "dot_accuracy_threshold": 1369.183838, + "dot_f1": 0.734985, + "dot_f1_threshold": 1344.360596, + "dot_precision": 0.679433, + "dot_recall": 0.800431, + "dot_ap": 0.784075, + "max_accuracy": 0.880176, + "max_f1": 0.763184, + "max_precision": 0.734768, + "max_recall": 0.813751, + "max_ap": 0.833393, + "main_score": 0.833393, + "hf_subset": "default", + "languages": [ + "eng-Latn" + ] + } + ] + }, + "evaluation_time": 3.1748311519622803, + "kg_co2_emissions": null +} \ No newline at end of file diff --git a/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/model_meta.json b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/model_meta.json new file mode 100644 index 0000000000..1e0af0138f --- /dev/null +++ b/results/Alibaba-NLP__gte-modernbert-base/7ca8b4ca700621b67618669f5378fe5f5820b8e4/model_meta.json @@ -0,0 +1,23 @@ +{ + "name": "Alibaba-NLP/gte-modernbert-base", + "revision": "7ca8b4ca700621b67618669f5378fe5f5820b8e4", + "release_date": "2025-01-21", + "languages": [ + "en" + ], + "loader": null, + "n_parameters": 149014272, + "memory_usage": null, + "max_tokens": 8192, + "embed_dim": 768, + "license": "apache-2.0", + "open_weights": true, + "public_training_data": false, + "public_training_code": false, + "framework": [ "PyTorch" + ], + "reference": "https://huggingface.co/Alibaba-NLP/gte-modernbert-base", + "similarity_fn_name": "cosine", + "use_instructions": false, + "zero_shot_benchmarks": null +}