File size: 5,957 Bytes
81d107a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 |
{
"dataset_revision": "ab518f4d6fcca38d87c25209f94beba119d02014",
"task_name": "HotpotQA",
"mteb_version": "1.25.1",
"scores": {
"test": [
{
"ndcg_at_1": 0.60162,
"ndcg_at_3": 0.44502,
"ndcg_at_5": 0.46295,
"ndcg_at_10": 0.47809,
"ndcg_at_20": 0.48903,
"ndcg_at_100": 0.50535,
"ndcg_at_1000": 0.51923,
"map_at_1": 0.30081,
"map_at_3": 0.36953,
"map_at_5": 0.38167,
"map_at_10": 0.38938,
"map_at_20": 0.39314,
"map_at_100": 0.39603,
"map_at_1000": 0.39663,
"recall_at_1": 0.30081,
"recall_at_3": 0.40614,
"recall_at_5": 0.44159,
"recall_at_10": 0.47961,
"recall_at_20": 0.51499,
"recall_at_100": 0.58731,
"recall_at_1000": 0.68035,
"precision_at_1": 0.60162,
"precision_at_3": 0.27076,
"precision_at_5": 0.17664,
"precision_at_10": 0.09592,
"precision_at_20": 0.0515,
"precision_at_100": 0.01175,
"precision_at_1000": 0.00136,
"mrr_at_1": 0.601621,
"mrr_at_3": 0.652622,
"mrr_at_5": 0.660826,
"mrr_at_10": 0.665901,
"mrr_at_20": 0.668133,
"mrr_at_100": 0.669551,
"mrr_at_1000": 0.669784,
"nauc_ndcg_at_1_max": 0.5116,
"nauc_ndcg_at_1_std": 0.073935,
"nauc_ndcg_at_1_diff1": 0.715694,
"nauc_ndcg_at_3_max": 0.378233,
"nauc_ndcg_at_3_std": 0.067468,
"nauc_ndcg_at_3_diff1": 0.494853,
"nauc_ndcg_at_5_max": 0.359559,
"nauc_ndcg_at_5_std": 0.073257,
"nauc_ndcg_at_5_diff1": 0.465013,
"nauc_ndcg_at_10_max": 0.339948,
"nauc_ndcg_at_10_std": 0.076042,
"nauc_ndcg_at_10_diff1": 0.443659,
"nauc_ndcg_at_20_max": 0.328131,
"nauc_ndcg_at_20_std": 0.074644,
"nauc_ndcg_at_20_diff1": 0.432222,
"nauc_ndcg_at_100_max": 0.312544,
"nauc_ndcg_at_100_std": 0.078449,
"nauc_ndcg_at_100_diff1": 0.415341,
"nauc_ndcg_at_1000_max": 0.305183,
"nauc_ndcg_at_1000_std": 0.078385,
"nauc_ndcg_at_1000_diff1": 0.409027,
"nauc_map_at_1_max": 0.5116,
"nauc_map_at_1_std": 0.073935,
"nauc_map_at_1_diff1": 0.715694,
"nauc_map_at_3_max": 0.334791,
"nauc_map_at_3_std": 0.058541,
"nauc_map_at_3_diff1": 0.444158,
"nauc_map_at_5_max": 0.31872,
"nauc_map_at_5_std": 0.060961,
"nauc_map_at_5_diff1": 0.421822,
"nauc_map_at_10_max": 0.307675,
"nauc_map_at_10_std": 0.06241,
"nauc_map_at_10_diff1": 0.410375,
"nauc_map_at_20_max": 0.303193,
"nauc_map_at_20_std": 0.061659,
"nauc_map_at_20_diff1": 0.406205,
"nauc_map_at_100_max": 0.299934,
"nauc_map_at_100_std": 0.062056,
"nauc_map_at_100_diff1": 0.402882,
"nauc_map_at_1000_max": 0.299604,
"nauc_map_at_1000_std": 0.06212,
"nauc_map_at_1000_diff1": 0.402604,
"nauc_recall_at_1_max": 0.5116,
"nauc_recall_at_1_std": 0.073935,
"nauc_recall_at_1_diff1": 0.715694,
"nauc_recall_at_3_max": 0.295614,
"nauc_recall_at_3_std": 0.061532,
"nauc_recall_at_3_diff1": 0.365997,
"nauc_recall_at_5_max": 0.250882,
"nauc_recall_at_5_std": 0.072136,
"nauc_recall_at_5_diff1": 0.296869,
"nauc_recall_at_10_max": 0.187916,
"nauc_recall_at_10_std": 0.075065,
"nauc_recall_at_10_diff1": 0.227623,
"nauc_recall_at_20_max": 0.139061,
"nauc_recall_at_20_std": 0.067366,
"nauc_recall_at_20_diff1": 0.176912,
"nauc_recall_at_100_max": 0.053559,
"nauc_recall_at_100_std": 0.077563,
"nauc_recall_at_100_diff1": 0.080251,
"nauc_recall_at_1000_max": -0.03957,
"nauc_recall_at_1000_std": 0.069824,
"nauc_recall_at_1000_diff1": -0.020025,
"nauc_precision_at_1_max": 0.5116,
"nauc_precision_at_1_std": 0.073935,
"nauc_precision_at_1_diff1": 0.715694,
"nauc_precision_at_3_max": 0.295614,
"nauc_precision_at_3_std": 0.061532,
"nauc_precision_at_3_diff1": 0.365997,
"nauc_precision_at_5_max": 0.250882,
"nauc_precision_at_5_std": 0.072136,
"nauc_precision_at_5_diff1": 0.296869,
"nauc_precision_at_10_max": 0.187916,
"nauc_precision_at_10_std": 0.075065,
"nauc_precision_at_10_diff1": 0.227623,
"nauc_precision_at_20_max": 0.139061,
"nauc_precision_at_20_std": 0.067366,
"nauc_precision_at_20_diff1": 0.176912,
"nauc_precision_at_100_max": 0.053559,
"nauc_precision_at_100_std": 0.077563,
"nauc_precision_at_100_diff1": 0.080251,
"nauc_precision_at_1000_max": -0.03957,
"nauc_precision_at_1000_std": 0.069824,
"nauc_precision_at_1000_diff1": -0.020025,
"nauc_mrr_at_1_max": 0.5116,
"nauc_mrr_at_1_std": 0.073935,
"nauc_mrr_at_1_diff1": 0.715694,
"nauc_mrr_at_3_max": 0.516213,
"nauc_mrr_at_3_std": 0.084836,
"nauc_mrr_at_3_diff1": 0.68779,
"nauc_mrr_at_5_max": 0.518266,
"nauc_mrr_at_5_std": 0.090287,
"nauc_mrr_at_5_diff1": 0.684759,
"nauc_mrr_at_10_max": 0.516795,
"nauc_mrr_at_10_std": 0.091841,
"nauc_mrr_at_10_diff1": 0.682263,
"nauc_mrr_at_20_max": 0.516508,
"nauc_mrr_at_20_std": 0.092047,
"nauc_mrr_at_20_diff1": 0.682142,
"nauc_mrr_at_100_max": 0.516723,
"nauc_mrr_at_100_std": 0.093048,
"nauc_mrr_at_100_diff1": 0.682074,
"nauc_mrr_at_1000_max": 0.516691,
"nauc_mrr_at_1000_std": 0.093012,
"nauc_mrr_at_1000_diff1": 0.682124,
"main_score": 0.47809,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 3732.872656583786,
"kg_co2_emissions": null
} |