Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -0,0 +1,95 @@
{
"dataset_revision": "e8379541af4e31359cca9fbcf4b00f2671dba205",
"task_name": "AmazonCounterfactualClassification",
"mteb_version": "1.34.11",
"scores": {
"test": [
{
"accuracy": 0.931791,
"f1": 0.895685,
"f1_weighted": 0.933042,
"ap": 0.722907,
"ap_weighted": 0.722907,
"scores_per_experiment": [
{
"accuracy": 0.931343,
"f1": 0.893906,
"f1_weighted": 0.932284,
"ap": 0.718166,
"ap_weighted": 0.718166
},
{
"accuracy": 0.937313,
"f1": 0.903658,
"f1_weighted": 0.938333,
"ap": 0.740693,
"ap_weighted": 0.740693
},
{
"accuracy": 0.932836,
"f1": 0.894164,
"f1_weighted": 0.933122,
"ap": 0.720645,
"ap_weighted": 0.720645
},
{
"accuracy": 0.938806,
"f1": 0.906708,
"f1_weighted": 0.940031,
"ap": 0.747417,
"ap_weighted": 0.747417
},
{
"accuracy": 0.937313,
"f1": 0.904176,
"f1_weighted": 0.938491,
"ap": 0.741559,
"ap_weighted": 0.741559
},
{
"accuracy": 0.931343,
"f1": 0.891503,
"f1_weighted": 0.93154,
"ap": 0.714751,
"ap_weighted": 0.714751
},
{
"accuracy": 0.938806,
"f1": 0.904651,
"f1_weighted": 0.939402,
"ap": 0.744258,
"ap_weighted": 0.744258
},
{
"accuracy": 0.937313,
"f1": 0.9015,
"f1_weighted": 0.937668,
"ap": 0.73766,
"ap_weighted": 0.73766
},
{
"accuracy": 0.920896,
"f1": 0.884811,
"f1_weighted": 0.924071,
"ap": 0.696409,
"ap_weighted": 0.696409
},
{
"accuracy": 0.91194,
"f1": 0.87177,
"f1_weighted": 0.915475,
"ap": 0.667513,
"ap_weighted": 0.667513
}
],
"main_score": 0.931791,
"hf_subset": "en",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 30.505733251571655,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
{
"dataset_revision": "0bbdb47bcbe3a90093699aefeed338a0f28a7ee8",
"task_name": "ArXivHierarchicalClusteringP2P",
"mteb_version": "1.34.11",
"scores": {
"test": [
{
"v_measures": {
"Level 0": [
0.702775,
0.68422,
0.704026,
0.688488,
0.673975,
0.690276,
0.711358,
0.705818,
0.663107,
0.696268
],
"Level 1": [
0.624535,
0.620938,
0.628675,
0.623568,
0.626589,
0.62843,
0.598491,
0.646755,
0.583919,
0.602664
]
},
"v_measure": 0.655244,
"v_measure_std": 0.040079,
"main_score": 0.655244,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 51.523176193237305,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
{
"dataset_revision": "b73bd54100e5abfa6e3a23dcafb46fe4d2438dc3",
"task_name": "ArXivHierarchicalClusteringS2S",
"mteb_version": "1.34.11",
"scores": {
"test": [
{
"v_measures": {
"Level 0": [
0.685815,
0.686635,
0.681438,
0.685412,
0.682867,
0.636021,
0.688174,
0.646933,
0.666273,
0.72283
],
"Level 1": [
0.614995,
0.604606,
0.577928,
0.604655,
0.59662,
0.61032,
0.603059,
0.594826,
0.600726,
0.603144
]
},
"v_measure": 0.639664,
"v_measure_std": 0.042352,
"main_score": 0.639664,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 22.7478187084198,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,158 @@
{
"dataset_revision": "c22ab2a51041ffd869aaddef7af8d8215647e41a",
"task_name": "ArguAna",
"mteb_version": "1.34.11",
"scores": {
"test": [
{
"ndcg_at_1": 0.72688,
"ndcg_at_3": 0.8491,
"ndcg_at_5": 0.86391,
"ndcg_at_10": 0.86948,
"ndcg_at_20": 0.87259,
"ndcg_at_100": 0.87301,
"ndcg_at_1000": 0.87301,
"map_at_1": 0.72688,
"map_at_3": 0.82101,
"map_at_5": 0.82933,
"map_at_10": 0.83165,
"map_at_20": 0.83253,
"map_at_100": 0.8326,
"map_at_1000": 0.8326,
"recall_at_1": 0.72688,
"recall_at_3": 0.92959,
"recall_at_5": 0.96515,
"recall_at_10": 0.98222,
"recall_at_20": 0.99431,
"recall_at_100": 0.99644,
"recall_at_1000": 0.99644,
"precision_at_1": 0.72688,
"precision_at_3": 0.30986,
"precision_at_5": 0.19303,
"precision_at_10": 0.09822,
"precision_at_20": 0.04972,
"precision_at_100": 0.00996,
"precision_at_1000": 0.001,
"mrr_at_1": 0.72973,
"mrr_at_3": 0.822191,
"mrr_at_5": 0.830299,
"mrr_at_10": 0.832622,
"mrr_at_20": 0.833507,
"mrr_at_100": 0.833574,
"mrr_at_1000": 0.833574,
"nauc_ndcg_at_1_max": 0.243558,
"nauc_ndcg_at_1_std": -0.312009,
"nauc_ndcg_at_1_diff1": 0.730076,
"nauc_ndcg_at_3_max": 0.311855,
"nauc_ndcg_at_3_std": -0.362613,
"nauc_ndcg_at_3_diff1": 0.673429,
"nauc_ndcg_at_5_max": 0.299501,
"nauc_ndcg_at_5_std": -0.360145,
"nauc_ndcg_at_5_diff1": 0.682702,
"nauc_ndcg_at_10_max": 0.288488,
"nauc_ndcg_at_10_std": -0.366102,
"nauc_ndcg_at_10_diff1": 0.687584,
"nauc_ndcg_at_20_max": 0.284189,
"nauc_ndcg_at_20_std": -0.346913,
"nauc_ndcg_at_20_diff1": 0.690641,
"nauc_ndcg_at_100_max": 0.287804,
"nauc_ndcg_at_100_std": -0.341777,
"nauc_ndcg_at_100_diff1": 0.689867,
"nauc_ndcg_at_1000_max": 0.287804,
"nauc_ndcg_at_1000_std": -0.341777,
"nauc_ndcg_at_1000_diff1": 0.689867,
"nauc_map_at_1_max": 0.243558,
"nauc_map_at_1_std": -0.312009,
"nauc_map_at_1_diff1": 0.730076,
"nauc_map_at_3_max": 0.292065,
"nauc_map_at_3_std": -0.34759,
"nauc_map_at_3_diff1": 0.68911,
"nauc_map_at_5_max": 0.285647,
"nauc_map_at_5_std": -0.345413,
"nauc_map_at_5_diff1": 0.694342,
"nauc_map_at_10_max": 0.281915,
"nauc_map_at_10_std": -0.347453,
"nauc_map_at_10_diff1": 0.696048,
"nauc_map_at_20_max": 0.280929,
"nauc_map_at_20_std": -0.343394,
"nauc_map_at_20_diff1": 0.696798,
"nauc_map_at_100_max": 0.281325,
"nauc_map_at_100_std": -0.342773,
"nauc_map_at_100_diff1": 0.696715,
"nauc_map_at_1000_max": 0.281325,
"nauc_map_at_1000_std": -0.342773,
"nauc_map_at_1000_diff1": 0.696715,
"nauc_recall_at_1_max": 0.243558,
"nauc_recall_at_1_std": -0.312009,
"nauc_recall_at_1_diff1": 0.730076,
"nauc_recall_at_3_max": 0.438901,
"nauc_recall_at_3_std": -0.459475,
"nauc_recall_at_3_diff1": 0.573613,
"nauc_recall_at_5_max": 0.459225,
"nauc_recall_at_5_std": -0.541884,
"nauc_recall_at_5_diff1": 0.547067,
"nauc_recall_at_10_max": 0.38513,
"nauc_recall_at_10_std": -0.823475,
"nauc_recall_at_10_diff1": 0.519102,
"nauc_recall_at_20_max": 0.255742,
"nauc_recall_at_20_std": -0.249581,
"nauc_recall_at_20_diff1": 0.39402,
"nauc_recall_at_100_max": 0.845472,
"nauc_recall_at_100_std": 0.643885,
"nauc_recall_at_100_diff1": 0.085991,
"nauc_recall_at_1000_max": 0.845472,
"nauc_recall_at_1000_std": 0.643885,
"nauc_recall_at_1000_diff1": 0.085991,
"nauc_precision_at_1_max": 0.243558,
"nauc_precision_at_1_std": -0.312009,
"nauc_precision_at_1_diff1": 0.730076,
"nauc_precision_at_3_max": 0.438901,
"nauc_precision_at_3_std": -0.459475,
"nauc_precision_at_3_diff1": 0.573613,
"nauc_precision_at_5_max": 0.459225,
"nauc_precision_at_5_std": -0.541884,
"nauc_precision_at_5_diff1": 0.547067,
"nauc_precision_at_10_max": 0.38513,
"nauc_precision_at_10_std": -0.823475,
"nauc_precision_at_10_diff1": 0.519102,
"nauc_precision_at_20_max": 0.255742,
"nauc_precision_at_20_std": -0.249581,
"nauc_precision_at_20_diff1": 0.39402,
"nauc_precision_at_100_max": 0.845472,
"nauc_precision_at_100_std": 0.643885,
"nauc_precision_at_100_diff1": 0.085991,
"nauc_precision_at_1000_max": 0.845472,
"nauc_precision_at_1000_std": 0.643885,
"nauc_precision_at_1000_diff1": 0.085991,
"nauc_mrr_at_1_max": 0.235308,
"nauc_mrr_at_1_std": -0.321152,
"nauc_mrr_at_1_diff1": 0.724418,
"nauc_mrr_at_3_max": 0.284107,
"nauc_mrr_at_3_std": -0.353853,
"nauc_mrr_at_3_diff1": 0.681045,
"nauc_mrr_at_5_max": 0.277606,
"nauc_mrr_at_5_std": -0.351775,
"nauc_mrr_at_5_diff1": 0.686305,
"nauc_mrr_at_10_max": 0.273734,
"nauc_mrr_at_10_std": -0.353614,
"nauc_mrr_at_10_diff1": 0.687894,
"nauc_mrr_at_20_max": 0.272695,
"nauc_mrr_at_20_std": -0.349574,
"nauc_mrr_at_20_diff1": 0.688599,
"nauc_mrr_at_100_max": 0.27309,
"nauc_mrr_at_100_std": -0.348953,
"nauc_mrr_at_100_diff1": 0.688512,
"nauc_mrr_at_1000_max": 0.27309,
"nauc_mrr_at_1000_std": -0.348953,
"nauc_mrr_at_1000_diff1": 0.688512,
"main_score": 0.86948,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 165.33597445487976,
"kg_co2_emissions": null
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
{
"dataset_revision": "2000358ca161889fa9c082cb41daa8dcfb161a54",
"task_name": "AskUbuntuDupQuestions",
"mteb_version": "1.34.11",
"scores": {
"test": [
{
"map": 0.656017,
"mrr": 0.777064,
"nAUC_map_max": 0.269237,
"nAUC_map_std": 0.236735,
"nAUC_map_diff1": 0.146193,
"nAUC_mrr_max": 0.418508,
"nAUC_mrr_std": 0.292988,
"nAUC_mrr_diff1": 0.219584,
"main_score": 0.656017,
"hf_subset": "default",
"languages": [
"eng-Latn"
]
}
]
},
"evaluation_time": 31.883575677871704,
"kg_co2_emissions": null
}
Loading
Loading