Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -0,0 +1,95 @@
{
"dataset_revision": "e8379541af4e31359cca9fbcf4b00f2671dba205",
"task_name": "AmazonCounterfactualClassification",
"mteb_version": "1.31.2",
"scores": {
"test": [
{
"accuracy": 0.969552,
"f1": 0.953324,
"f1_weighted": 0.970082,
"ap": 0.865487,
"ap_weighted": 0.865487,
"scores_per_experiment": [
{
"accuracy": 0.974627,
"f1": 0.960898,
"f1_weighted": 0.975007,
"ap": 0.885243,
"ap_weighted": 0.885243
},
{
"accuracy": 0.968657,
"f1": 0.951959,
"f1_weighted": 0.969206,
"ap": 0.860985,
"ap_weighted": 0.860985
},
{
"accuracy": 0.970149,
"f1": 0.953358,
"f1_weighted": 0.9704,
"ap": 0.867193,
"ap_weighted": 0.867193
},
{
"accuracy": 0.973134,
"f1": 0.958711,
"f1_weighted": 0.973571,
"ap": 0.879084,
"ap_weighted": 0.879084
},
{
"accuracy": 0.968657,
"f1": 0.951432,
"f1_weighted": 0.969045,
"ap": 0.860918,
"ap_weighted": 0.860918
},
{
"accuracy": 0.974627,
"f1": 0.960683,
"f1_weighted": 0.974941,
"ap": 0.885414,
"ap_weighted": 0.885414
},
{
"accuracy": 0.973134,
"f1": 0.958255,
"f1_weighted": 0.973432,
"ap": 0.879339,
"ap_weighted": 0.879339
},
{
"accuracy": 0.977612,
"f1": 0.965116,
"f1_weighted": 0.97783,
"ap": 0.89816,
"ap_weighted": 0.89816
},
{
"accuracy": 0.956716,
"f1": 0.935379,
"f1_weighted": 0.957991,
"ap": 0.816612,
"ap_weighted": 0.816612
},
{
"accuracy": 0.958209,
"f1": 0.937447,
"f1_weighted": 0.959392,
"ap": 0.82192,
"ap_weighted": 0.82192
}
],
"main_score": 0.969552,
"hf_subset": "en",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 41.224671602249146,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
{
"dataset_revision": "0bbdb47bcbe3a90093699aefeed338a0f28a7ee8",
"task_name": "ArXivHierarchicalClusteringP2P",
"mteb_version": "1.31.2",
"scores": {
"test": [
{
"v_measures": {
"Level 0": [
0.734627,
0.692796,
0.674868,
0.688748,
0.65051,
0.665281,
0.712468,
0.730769,
0.662646,
0.709435
],
"Level 1": [
0.617987,
0.579289,
0.609534,
0.593757,
0.592276,
0.600809,
0.58152,
0.592046,
0.608279,
0.605467
]
},
"v_measure": 0.645156,
"v_measure_std": 0.051646,
"main_score": 0.645156,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 14.439682960510254,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
{
"dataset_revision": "b73bd54100e5abfa6e3a23dcafb46fe4d2438dc3",
"task_name": "ArXivHierarchicalClusteringS2S",
"mteb_version": "1.31.2",
"scores": {
"test": [
{
"v_measures": {
"Level 0": [
0.676202,
0.678907,
0.683023,
0.668376,
0.707832,
0.681361,
0.641119,
0.721545,
0.712057,
0.698236
],
"Level 1": [
0.589873,
0.619368,
0.600436,
0.614185,
0.587109,
0.59567,
0.604972,
0.601508,
0.587307,
0.605132
]
},
"v_measure": 0.643711,
"v_measure_std": 0.046575,
"main_score": 0.643711,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 13.052504301071167,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,158 @@
{
"dataset_revision": "c22ab2a51041ffd869aaddef7af8d8215647e41a",
"task_name": "ArguAna",
"mteb_version": "1.31.2",
"scores": {
"test": [
{
"ndcg_at_1": 0.55548,
"ndcg_at_3": 0.72962,
"ndcg_at_5": 0.76139,
"ndcg_at_10": 0.77873,
"ndcg_at_20": 0.7831,
"ndcg_at_100": 0.7831,
"ndcg_at_1000": 0.7831,
"map_at_1": 0.55548,
"map_at_3": 0.68789,
"map_at_5": 0.7056,
"map_at_10": 0.71281,
"map_at_20": 0.71413,
"map_at_100": 0.71413,
"map_at_1000": 0.71413,
"recall_at_1": 0.55548,
"recall_at_3": 0.84993,
"recall_at_5": 0.92674,
"recall_at_10": 0.98009,
"recall_at_20": 0.99644,
"recall_at_100": 0.99644,
"recall_at_1000": 0.99644,
"precision_at_1": 0.55548,
"precision_at_3": 0.28331,
"precision_at_5": 0.18535,
"precision_at_10": 0.09801,
"precision_at_20": 0.04982,
"precision_at_100": 0.00996,
"precision_at_1000": 0.001,
"mrr_at_1": 0.559033,
"mrr_at_3": 0.689426,
"mrr_at_5": 0.706994,
"mrr_at_10": 0.714324,
"mrr_at_20": 0.715647,
"mrr_at_100": 0.715647,
"mrr_at_1000": 0.715647,
"nauc_ndcg_at_1_max": -0.209535,
"nauc_ndcg_at_1_std": -0.242867,
"nauc_ndcg_at_1_diff1": 0.326084,
"nauc_ndcg_at_3_max": -0.188653,
"nauc_ndcg_at_3_std": -0.273796,
"nauc_ndcg_at_3_diff1": 0.30745,
"nauc_ndcg_at_5_max": -0.188827,
"nauc_ndcg_at_5_std": -0.266878,
"nauc_ndcg_at_5_diff1": 0.298944,
"nauc_ndcg_at_10_max": -0.201498,
"nauc_ndcg_at_10_std": -0.263769,
"nauc_ndcg_at_10_diff1": 0.295597,
"nauc_ndcg_at_20_max": -0.197053,
"nauc_ndcg_at_20_std": -0.254431,
"nauc_ndcg_at_20_diff1": 0.303115,
"nauc_ndcg_at_100_max": -0.197053,
"nauc_ndcg_at_100_std": -0.254431,
"nauc_ndcg_at_100_diff1": 0.303115,
"nauc_ndcg_at_1000_max": -0.197053,
"nauc_ndcg_at_1000_std": -0.254431,
"nauc_ndcg_at_1000_diff1": 0.303115,
"nauc_map_at_1_max": -0.209535,
"nauc_map_at_1_std": -0.242867,
"nauc_map_at_1_diff1": 0.326084,
"nauc_map_at_3_max": -0.196622,
"nauc_map_at_3_std": -0.263645,
"nauc_map_at_3_diff1": 0.308777,
"nauc_map_at_5_max": -0.197007,
"nauc_map_at_5_std": -0.25924,
"nauc_map_at_5_diff1": 0.304622,
"nauc_map_at_10_max": -0.201492,
"nauc_map_at_10_std": -0.258659,
"nauc_map_at_10_diff1": 0.304005,
"nauc_map_at_20_max": -0.200505,
"nauc_map_at_20_std": -0.256572,
"nauc_map_at_20_diff1": 0.30579,
"nauc_map_at_100_max": -0.200505,
"nauc_map_at_100_std": -0.256572,
"nauc_map_at_100_diff1": 0.30579,
"nauc_map_at_1000_max": -0.200505,
"nauc_map_at_1000_std": -0.256572,
"nauc_map_at_1000_diff1": 0.30579,
"nauc_recall_at_1_max": -0.209535,
"nauc_recall_at_1_std": -0.242867,
"nauc_recall_at_1_diff1": 0.326084,
"nauc_recall_at_3_max": -0.147861,
"nauc_recall_at_3_std": -0.324772,
"nauc_recall_at_3_diff1": 0.304131,
"nauc_recall_at_5_max": -0.113058,
"nauc_recall_at_5_std": -0.336329,
"nauc_recall_at_5_diff1": 0.250982,
"nauc_recall_at_10_max": -0.245492,
"nauc_recall_at_10_std": -0.397657,
"nauc_recall_at_10_diff1": 0.014255,
"nauc_recall_at_20_max": 0.370551,
"nauc_recall_at_20_std": 0.713396,
"nauc_recall_at_20_diff1": 0.076531,
"nauc_recall_at_100_max": 0.370551,
"nauc_recall_at_100_std": 0.713396,
"nauc_recall_at_100_diff1": 0.076531,
"nauc_recall_at_1000_max": 0.370551,
"nauc_recall_at_1000_std": 0.713396,
"nauc_recall_at_1000_diff1": 0.076531,
"nauc_precision_at_1_max": -0.209535,
"nauc_precision_at_1_std": -0.242867,
"nauc_precision_at_1_diff1": 0.326084,
"nauc_precision_at_3_max": -0.147861,
"nauc_precision_at_3_std": -0.324772,
"nauc_precision_at_3_diff1": 0.304131,
"nauc_precision_at_5_max": -0.113058,
"nauc_precision_at_5_std": -0.336329,
"nauc_precision_at_5_diff1": 0.250982,
"nauc_precision_at_10_max": -0.245492,
"nauc_precision_at_10_std": -0.397657,
"nauc_precision_at_10_diff1": 0.014255,
"nauc_precision_at_20_max": 0.370551,
"nauc_precision_at_20_std": 0.713396,
"nauc_precision_at_20_diff1": 0.076531,
"nauc_precision_at_100_max": 0.370551,
"nauc_precision_at_100_std": 0.713396,
"nauc_precision_at_100_diff1": 0.076531,
"nauc_precision_at_1000_max": 0.370551,
"nauc_precision_at_1000_std": 0.713396,
"nauc_precision_at_1000_diff1": 0.076531,
"nauc_mrr_at_1_max": -0.215027,
"nauc_mrr_at_1_std": -0.245771,
"nauc_mrr_at_1_diff1": 0.316544,
"nauc_mrr_at_3_max": -0.203939,
"nauc_mrr_at_3_std": -0.266166,
"nauc_mrr_at_3_diff1": 0.298534,
"nauc_mrr_at_5_max": -0.204936,
"nauc_mrr_at_5_std": -0.261841,
"nauc_mrr_at_5_diff1": 0.292964,
"nauc_mrr_at_10_max": -0.208877,
"nauc_mrr_at_10_std": -0.260564,
"nauc_mrr_at_10_diff1": 0.293042,
"nauc_mrr_at_20_max": -0.207931,
"nauc_mrr_at_20_std": -0.258485,
"nauc_mrr_at_20_diff1": 0.294766,
"nauc_mrr_at_100_max": -0.207931,
"nauc_mrr_at_100_std": -0.258485,
"nauc_mrr_at_100_diff1": 0.294766,
"nauc_mrr_at_1000_max": -0.207931,
"nauc_mrr_at_1000_std": -0.258485,
"nauc_mrr_at_1000_diff1": 0.294766,
"main_score": 0.77873,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 189.00718069076538,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
{
"dataset_revision": "2000358ca161889fa9c082cb41daa8dcfb161a54",
"task_name": "AskUbuntuDupQuestions",
"mteb_version": "1.31.2",
"scores": {
"test": [
{
"map": 0.64535,
"mrr": 0.766876,
"nAUC_map_max": 0.235344,
"nAUC_map_std": 0.209714,
"nAUC_map_diff1": 0.168035,
"nAUC_mrr_max": 0.367769,
"nAUC_mrr_std": 0.276248,
"nAUC_mrr_diff1": 0.210136,
"main_score": 0.64535,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 39.275365591049194,
"kg_co2_emissions": null
}
Loading
Loading