Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

update NanoBEIR results #84

Merged
merged 1 commit into from
Jan 3, 2025
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
{
"dataset_revision": "8f4a982d470a32c45817738b9d29042ca55d75ad",
"task_name": "NanoArguAnaRetrieval",
"mteb_version": "1.23.2",
"mteb_version": "1.25.20",
"scores": {
"train": [
{
Expand Down Expand Up @@ -39,7 +39,7 @@
"mrr_at_10": 0.349595,
"mrr_at_20": 0.358099,
"mrr_at_100": 0.360406,
"mrr_at_1000": 0.360699,
"mrr_at_1000": 0.360697,
"nauc_ndcg_at_1_max": -0.326785,
"nauc_ndcg_at_1_std": -0.157071,
"nauc_ndcg_at_1_diff1": -0.373839,
Expand Down Expand Up @@ -142,9 +142,9 @@
"nauc_mrr_at_100_max": -0.043418,
"nauc_mrr_at_100_std": -0.092378,
"nauc_mrr_at_100_diff1": -0.127424,
"nauc_mrr_at_1000_max": -0.044506,
"nauc_mrr_at_1000_std": -0.092946,
"nauc_mrr_at_1000_diff1": -0.128607,
"nauc_mrr_at_1000_max": -0.044498,
"nauc_mrr_at_1000_std": -0.092939,
"nauc_mrr_at_1000_diff1": -0.128599,
"main_score": 0.44536,
"hf_subset": "default",
"languages": [
Expand All @@ -153,6 +153,6 @@
}
]
},
"evaluation_time": 62.61475086212158,
"evaluation_time": 18.93425226211548,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -1,158 +1,158 @@
{
"dataset_revision": "96741bfa30b9f56db8c9eb7d08e775ed6474f206",
"task_name": "NanoClimateFeverRetrieval",
"mteb_version": "1.23.2",
"mteb_version": "1.25.20",
"scores": {
"train": [
{
"ndcg_at_1": 0.14,
"ndcg_at_3": 0.18786,
"ndcg_at_5": 0.18786,
"ndcg_at_10": 0.2222,
"ndcg_at_20": 0.2529,
"ndcg_at_100": 0.30066,
"ndcg_at_1000": 0.32817,
"map_at_1": 0.14,
"map_at_3": 0.17667,
"map_at_5": 0.17667,
"map_at_10": 0.19202,
"map_at_20": 0.20067,
"map_at_100": 0.20693,
"map_at_1000": 0.20758,
"recall_at_1": 0.14,
"ndcg_at_1": 0.3,
"ndcg_at_3": 0.24304,
"ndcg_at_5": 0.26237,
"ndcg_at_10": 0.30643,
"ndcg_at_20": 0.35175,
"ndcg_at_100": 0.40716,
"ndcg_at_1000": 0.44742,
"map_at_1": 0.13667,
"map_at_3": 0.17889,
"map_at_5": 0.19619,
"map_at_10": 0.21763,
"map_at_20": 0.23124,
"map_at_100": 0.24215,
"map_at_1000": 0.24442,
"recall_at_1": 0.13667,
"recall_at_3": 0.22,
"recall_at_5": 0.22,
"recall_at_10": 0.32,
"recall_at_20": 0.44,
"recall_at_100": 0.7,
"recall_at_1000": 0.94,
"precision_at_1": 0.14,
"precision_at_3": 0.07333,
"precision_at_5": 0.044,
"precision_at_10": 0.032,
"precision_at_20": 0.022,
"precision_at_100": 0.007,
"precision_at_1000": 0.00094,
"mrr_at_1": 0.14,
"mrr_at_3": 0.176667,
"mrr_at_5": 0.176667,
"mrr_at_10": 0.192024,
"mrr_at_20": 0.200667,
"mrr_at_100": 0.206933,
"mrr_at_1000": 0.207577,
"nauc_ndcg_at_1_max": 0.324621,
"nauc_ndcg_at_1_std": 0.081718,
"nauc_ndcg_at_1_diff1": 0.321821,
"nauc_ndcg_at_3_max": 0.293153,
"nauc_ndcg_at_3_std": 0.109611,
"nauc_ndcg_at_3_diff1": 0.322017,
"nauc_ndcg_at_5_max": 0.293153,
"nauc_ndcg_at_5_std": 0.109611,
"nauc_ndcg_at_5_diff1": 0.322017,
"nauc_ndcg_at_10_max": 0.239257,
"nauc_ndcg_at_10_std": 0.130088,
"nauc_ndcg_at_10_diff1": 0.202381,
"nauc_ndcg_at_20_max": 0.189477,
"nauc_ndcg_at_20_std": 0.156023,
"nauc_ndcg_at_20_diff1": 0.218851,
"nauc_ndcg_at_100_max": 0.177323,
"nauc_ndcg_at_100_std": 0.140537,
"nauc_ndcg_at_100_diff1": 0.184873,
"nauc_ndcg_at_1000_max": 0.200843,
"nauc_ndcg_at_1000_std": 0.114844,
"nauc_ndcg_at_1000_diff1": 0.218372,
"nauc_map_at_1_max": 0.324621,
"nauc_map_at_1_std": 0.081718,
"nauc_map_at_1_diff1": 0.321821,
"nauc_map_at_3_max": 0.296776,
"nauc_map_at_3_std": 0.099373,
"nauc_map_at_3_diff1": 0.323464,
"nauc_map_at_5_max": 0.296776,
"nauc_map_at_5_std": 0.099373,
"nauc_map_at_5_diff1": 0.323464,
"nauc_map_at_10_max": 0.268693,
"nauc_map_at_10_std": 0.109821,
"nauc_map_at_10_diff1": 0.26528,
"nauc_map_at_20_max": 0.253475,
"nauc_map_at_20_std": 0.120122,
"nauc_map_at_20_diff1": 0.267912,
"nauc_map_at_100_max": 0.252658,
"nauc_map_at_100_std": 0.11747,
"nauc_map_at_100_diff1": 0.263096,
"nauc_map_at_1000_max": 0.254043,
"nauc_map_at_1000_std": 0.116815,
"nauc_map_at_1000_diff1": 0.263974,
"nauc_recall_at_1_max": 0.324621,
"nauc_recall_at_1_std": 0.081718,
"nauc_recall_at_1_diff1": 0.321821,
"nauc_recall_at_3_max": 0.285173,
"nauc_recall_at_3_std": 0.136619,
"nauc_recall_at_3_diff1": 0.317898,
"nauc_recall_at_5_max": 0.285173,
"nauc_recall_at_5_std": 0.136619,
"nauc_recall_at_5_diff1": 0.317898,
"nauc_recall_at_10_max": 0.165605,
"nauc_recall_at_10_std": 0.180697,
"nauc_recall_at_10_diff1": 0.03516,
"nauc_recall_at_20_max": 0.010101,
"nauc_recall_at_20_std": 0.248264,
"nauc_recall_at_20_diff1": 0.1032,
"nauc_recall_at_100_max": -0.134606,
"nauc_recall_at_100_std": 0.198559,
"nauc_recall_at_100_diff1": -0.125779,
"nauc_recall_at_1000_max": -0.530812,
"nauc_recall_at_1000_std": -0.51774,
"nauc_recall_at_1000_diff1": 0.037815,
"nauc_precision_at_1_max": 0.324621,
"nauc_precision_at_1_std": 0.081718,
"nauc_precision_at_1_diff1": 0.321821,
"nauc_precision_at_3_max": 0.285173,
"nauc_precision_at_3_std": 0.136619,
"nauc_precision_at_3_diff1": 0.317898,
"nauc_precision_at_5_max": 0.285173,
"nauc_precision_at_5_std": 0.136619,
"nauc_precision_at_5_diff1": 0.317898,
"nauc_precision_at_10_max": 0.165605,
"nauc_precision_at_10_std": 0.180697,
"nauc_precision_at_10_diff1": 0.03516,
"nauc_precision_at_20_max": 0.010101,
"nauc_precision_at_20_std": 0.248264,
"nauc_precision_at_20_diff1": 0.1032,
"nauc_precision_at_100_max": -0.134606,
"nauc_precision_at_100_std": 0.198559,
"nauc_precision_at_100_diff1": -0.125779,
"nauc_precision_at_1000_max": -0.530812,
"nauc_precision_at_1000_std": -0.51774,
"nauc_precision_at_1000_diff1": 0.037815,
"nauc_mrr_at_1_max": 0.324621,
"nauc_mrr_at_1_std": 0.081718,
"nauc_mrr_at_1_diff1": 0.321821,
"nauc_mrr_at_3_max": 0.296776,
"nauc_mrr_at_3_std": 0.099373,
"nauc_mrr_at_3_diff1": 0.323464,
"nauc_mrr_at_5_max": 0.296776,
"nauc_mrr_at_5_std": 0.099373,
"nauc_mrr_at_5_diff1": 0.323464,
"nauc_mrr_at_10_max": 0.268693,
"nauc_mrr_at_10_std": 0.109821,
"nauc_mrr_at_10_diff1": 0.26528,
"nauc_mrr_at_20_max": 0.253475,
"nauc_mrr_at_20_std": 0.120122,
"nauc_mrr_at_20_diff1": 0.267912,
"nauc_mrr_at_100_max": 0.252658,
"nauc_mrr_at_100_std": 0.11747,
"nauc_mrr_at_100_diff1": 0.263096,
"nauc_mrr_at_1000_max": 0.254043,
"nauc_mrr_at_1000_std": 0.116815,
"nauc_mrr_at_1000_diff1": 0.263974,
"main_score": 0.2222,
"recall_at_5": 0.274,
"recall_at_10": 0.37233,
"recall_at_20": 0.50533,
"recall_at_100": 0.71967,
"recall_at_1000": 0.95133,
"precision_at_1": 0.3,
"precision_at_3": 0.16,
"precision_at_5": 0.132,
"precision_at_10": 0.094,
"precision_at_20": 0.066,
"precision_at_100": 0.0202,
"precision_at_1000": 0.00278,
"mrr_at_1": 0.3,
"mrr_at_3": 0.363333,
"mrr_at_5": 0.391333,
"mrr_at_10": 0.40669,
"mrr_at_20": 0.419132,
"mrr_at_100": 0.422186,
"mrr_at_1000": 0.422216,
"nauc_ndcg_at_1_max": 0.181597,
"nauc_ndcg_at_1_std": 0.14798,
"nauc_ndcg_at_1_diff1": 0.293339,
"nauc_ndcg_at_3_max": 0.149632,
"nauc_ndcg_at_3_std": 0.097799,
"nauc_ndcg_at_3_diff1": 0.316385,
"nauc_ndcg_at_5_max": 0.210865,
"nauc_ndcg_at_5_std": 0.115939,
"nauc_ndcg_at_5_diff1": 0.346206,
"nauc_ndcg_at_10_max": 0.235673,
"nauc_ndcg_at_10_std": 0.154558,
"nauc_ndcg_at_10_diff1": 0.250718,
"nauc_ndcg_at_20_max": 0.240714,
"nauc_ndcg_at_20_std": 0.182953,
"nauc_ndcg_at_20_diff1": 0.252656,
"nauc_ndcg_at_100_max": 0.257965,
"nauc_ndcg_at_100_std": 0.209827,
"nauc_ndcg_at_100_diff1": 0.200714,
"nauc_ndcg_at_1000_max": 0.237272,
"nauc_ndcg_at_1000_std": 0.178112,
"nauc_ndcg_at_1000_diff1": 0.2442,
"nauc_map_at_1_max": 0.266133,
"nauc_map_at_1_std": 0.07396,
"nauc_map_at_1_diff1": 0.454136,
"nauc_map_at_3_max": 0.198254,
"nauc_map_at_3_std": 0.06462,
"nauc_map_at_3_diff1": 0.393445,
"nauc_map_at_5_max": 0.208258,
"nauc_map_at_5_std": 0.073492,
"nauc_map_at_5_diff1": 0.396923,
"nauc_map_at_10_max": 0.215698,
"nauc_map_at_10_std": 0.09792,
"nauc_map_at_10_diff1": 0.334522,
"nauc_map_at_20_max": 0.220486,
"nauc_map_at_20_std": 0.111722,
"nauc_map_at_20_diff1": 0.332673,
"nauc_map_at_100_max": 0.226479,
"nauc_map_at_100_std": 0.120319,
"nauc_map_at_100_diff1": 0.319103,
"nauc_map_at_1000_max": 0.226414,
"nauc_map_at_1000_std": 0.119015,
"nauc_map_at_1000_diff1": 0.32081,
"nauc_recall_at_1_max": 0.266133,
"nauc_recall_at_1_std": 0.07396,
"nauc_recall_at_1_diff1": 0.454136,
"nauc_recall_at_3_max": 0.148535,
"nauc_recall_at_3_std": 0.082401,
"nauc_recall_at_3_diff1": 0.294734,
"nauc_recall_at_5_max": 0.22616,
"nauc_recall_at_5_std": 0.124862,
"nauc_recall_at_5_diff1": 0.301651,
"nauc_recall_at_10_max": 0.284796,
"nauc_recall_at_10_std": 0.194855,
"nauc_recall_at_10_diff1": 0.10337,
"nauc_recall_at_20_max": 0.256518,
"nauc_recall_at_20_std": 0.243799,
"nauc_recall_at_20_diff1": 0.075321,
"nauc_recall_at_100_max": 0.313317,
"nauc_recall_at_100_std": 0.347707,
"nauc_recall_at_100_diff1": -0.177808,
"nauc_recall_at_1000_max": 0.234765,
"nauc_recall_at_1000_std": 0.321663,
"nauc_recall_at_1000_diff1": -0.046929,
"nauc_precision_at_1_max": 0.181597,
"nauc_precision_at_1_std": 0.14798,
"nauc_precision_at_1_diff1": 0.293339,
"nauc_precision_at_3_max": 0.013197,
"nauc_precision_at_3_std": 0.089997,
"nauc_precision_at_3_diff1": 0.20392,
"nauc_precision_at_5_max": 0.158655,
"nauc_precision_at_5_std": 0.171949,
"nauc_precision_at_5_diff1": 0.198834,
"nauc_precision_at_10_max": 0.170825,
"nauc_precision_at_10_std": 0.252723,
"nauc_precision_at_10_diff1": -0.090663,
"nauc_precision_at_20_max": 0.170508,
"nauc_precision_at_20_std": 0.289597,
"nauc_precision_at_20_diff1": -0.141886,
"nauc_precision_at_100_max": 0.108359,
"nauc_precision_at_100_std": 0.283899,
"nauc_precision_at_100_diff1": -0.337731,
"nauc_precision_at_1000_max": -0.109028,
"nauc_precision_at_1000_std": 0.059062,
"nauc_precision_at_1000_diff1": -0.236173,
"nauc_mrr_at_1_max": 0.181597,
"nauc_mrr_at_1_std": 0.14798,
"nauc_mrr_at_1_diff1": 0.293339,
"nauc_mrr_at_3_max": 0.119709,
"nauc_mrr_at_3_std": 0.136809,
"nauc_mrr_at_3_diff1": 0.272488,
"nauc_mrr_at_5_max": 0.184851,
"nauc_mrr_at_5_std": 0.173771,
"nauc_mrr_at_5_diff1": 0.263908,
"nauc_mrr_at_10_max": 0.18718,
"nauc_mrr_at_10_std": 0.166671,
"nauc_mrr_at_10_diff1": 0.250674,
"nauc_mrr_at_20_max": 0.182102,
"nauc_mrr_at_20_std": 0.171275,
"nauc_mrr_at_20_diff1": 0.251402,
"nauc_mrr_at_100_max": 0.181413,
"nauc_mrr_at_100_std": 0.169804,
"nauc_mrr_at_100_diff1": 0.252159,
"nauc_mrr_at_1000_max": 0.181364,
"nauc_mrr_at_1000_std": 0.169728,
"nauc_mrr_at_1000_diff1": 0.25234,
"main_score": 0.30643,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 7762.315868854523,
"evaluation_time": 28.609407663345337,
"kg_co2_emissions": null
}
Loading
Loading