From 49947498835ca4109f04355e93d6e1569deceae5 Mon Sep 17 00:00:00 2001 From: Isaac Chung Date: Sun, 16 Feb 2025 16:22:40 +0000 Subject: [PATCH 1/3] add most image classification descr stats --- .../Image/ImageClassification/CIFAR10.json | 44 ++ .../Image/ImageClassification/CIFAR100.json | 314 +++++++++ .../Image/ImageClassification/Caltech101.json | 320 +++++++++ .../Image/ImageClassification/Country211.json | 647 ++++++++++++++++++ .../Image/ImageClassification/DTD.json | 155 +++++ .../Image/ImageClassification/EuroSAT.json | 44 ++ .../Image/ImageClassification/FER2013.json | 35 + .../ImageClassification/FGVCAircraft.json | 314 +++++++++ .../Food101Classification.json | 317 +++++++++ .../Image/ImageClassification/GTSRB.json | 143 ++++ .../OxfordFlowersClassification.json | 320 +++++++++ .../Image/ImageClassification/OxfordPets.json | 125 ++++ .../ImageClassification/PatchCamelyon.json | 20 + .../Image/ImageClassification/RESISC45.json | 149 ++++ .../Image/ImageClassification/STL10.json | 44 ++ .../ImageClassification/StanfordCars.json | 602 ++++++++++++++++ mteb/encoder_interface.py | 46 +- mteb/models/lens_models.py | 1 - 18 files changed, 3638 insertions(+), 2 deletions(-) create mode 100644 mteb/descriptive_stats/Image/ImageClassification/CIFAR10.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/CIFAR100.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/Caltech101.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/Country211.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/DTD.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/EuroSAT.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/FER2013.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/FGVCAircraft.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/Food101Classification.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/GTSRB.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/OxfordFlowersClassification.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/OxfordPets.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/PatchCamelyon.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/RESISC45.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/STL10.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/StanfordCars.json diff --git a/mteb/descriptive_stats/Image/ImageClassification/CIFAR10.json b/mteb/descriptive_stats/Image/ImageClassification/CIFAR10.json new file mode 100644 index 0000000000..34ff70e050 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/CIFAR10.json @@ -0,0 +1,44 @@ +{ + "test": { + "num_samples": 10000, + "unique_num_labels": 10, + "min_image_width": 32, + "average_image_width": 32.0, + "max_image_width": 32, + "min_image_height": 32, + "average_image_height": 32.0, + "max_image_height": 32, + "labels": { + "3": { + "count": 1000 + }, + "8": { + "count": 1000 + }, + "0": { + "count": 1000 + }, + "6": { + "count": 1000 + }, + "1": { + "count": 1000 + }, + "9": { + "count": 1000 + }, + "5": { + "count": 1000 + }, + "7": { + "count": 1000 + }, + "4": { + "count": 1000 + }, + "2": { + "count": 1000 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/CIFAR100.json b/mteb/descriptive_stats/Image/ImageClassification/CIFAR100.json new file mode 100644 index 0000000000..e8a282bc67 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/CIFAR100.json @@ -0,0 +1,314 @@ +{ + "test": { + "num_samples": 10000, + "unique_num_labels": 100, + "min_image_width": 32, + "average_image_width": 32.0, + "max_image_width": 32, + "min_image_height": 32, + "average_image_height": 32.0, + "max_image_height": 32, + "labels": { + "49": { + "count": 100 + }, + "33": { + "count": 100 + }, + "72": { + "count": 100 + }, + "51": { + "count": 100 + }, + "71": { + "count": 100 + }, + "92": { + "count": 100 + }, + "15": { + "count": 100 + }, + "14": { + "count": 100 + }, + "23": { + "count": 100 + }, + "0": { + "count": 100 + }, + "75": { + "count": 100 + }, + "81": { + "count": 100 + }, + "69": { + "count": 100 + }, + "40": { + "count": 100 + }, + "43": { + "count": 100 + }, + "97": { + "count": 100 + }, + "70": { + "count": 100 + }, + "53": { + "count": 100 + }, + "29": { + "count": 100 + }, + "21": { + "count": 100 + }, + "16": { + "count": 100 + }, + "39": { + "count": 100 + }, + "8": { + "count": 100 + }, + "20": { + "count": 100 + }, + "61": { + "count": 100 + }, + "41": { + "count": 100 + }, + "93": { + "count": 100 + }, + "56": { + "count": 100 + }, + "73": { + "count": 100 + }, + "58": { + "count": 100 + }, + "11": { + "count": 100 + }, + "25": { + "count": 100 + }, + "37": { + "count": 100 + }, + "63": { + "count": 100 + }, + "24": { + "count": 100 + }, + "22": { + "count": 100 + }, + "17": { + "count": 100 + }, + "4": { + "count": 100 + }, + "6": { + "count": 100 + }, + "9": { + "count": 100 + }, + "57": { + "count": 100 + }, + "2": { + "count": 100 + }, + "32": { + "count": 100 + }, + "52": { + "count": 100 + }, + "42": { + "count": 100 + }, + "77": { + "count": 100 + }, + "27": { + "count": 100 + }, + "65": { + "count": 100 + }, + "7": { + "count": 100 + }, + "35": { + "count": 100 + }, + "82": { + "count": 100 + }, + "66": { + "count": 100 + }, + "90": { + "count": 100 + }, + "67": { + "count": 100 + }, + "91": { + "count": 100 + }, + "10": { + "count": 100 + }, + "78": { + "count": 100 + }, + "54": { + "count": 100 + }, + "89": { + "count": 100 + }, + "18": { + "count": 100 + }, + "13": { + "count": 100 + }, + "50": { + "count": 100 + }, + "26": { + "count": 100 + }, + "83": { + "count": 100 + }, + "47": { + "count": 100 + }, + "95": { + "count": 100 + }, + "76": { + "count": 100 + }, + "59": { + "count": 100 + }, + "85": { + "count": 100 + }, + "19": { + "count": 100 + }, + "46": { + "count": 100 + }, + "1": { + "count": 100 + }, + "74": { + "count": 100 + }, + "60": { + "count": 100 + }, + "64": { + "count": 100 + }, + "45": { + "count": 100 + }, + "36": { + "count": 100 + }, + "87": { + "count": 100 + }, + "30": { + "count": 100 + }, + "99": { + "count": 100 + }, + "80": { + "count": 100 + }, + "28": { + "count": 100 + }, + "98": { + "count": 100 + }, + "12": { + "count": 100 + }, + "94": { + "count": 100 + }, + "68": { + "count": 100 + }, + "44": { + "count": 100 + }, + "31": { + "count": 100 + }, + "79": { + "count": 100 + }, + "34": { + "count": 100 + }, + "55": { + "count": 100 + }, + "62": { + "count": 100 + }, + "96": { + "count": 100 + }, + "84": { + "count": 100 + }, + "38": { + "count": 100 + }, + "86": { + "count": 100 + }, + "5": { + "count": 100 + }, + "48": { + "count": 100 + }, + "3": { + "count": 100 + }, + "88": { + "count": 100 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/Caltech101.json b/mteb/descriptive_stats/Image/ImageClassification/Caltech101.json new file mode 100644 index 0000000000..3d94eab4ca --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/Caltech101.json @@ -0,0 +1,320 @@ +{ + "test": { + "num_samples": 6084, + "unique_num_labels": 102, + "min_image_width": 80, + "average_image_width": 311.7217291255753, + "max_image_width": 3481, + "min_image_height": 101, + "average_image_height": 241.84418145956607, + "max_image_height": 3999, + "labels": { + "4": { + "count": 437 + }, + "37": { + "count": 405 + }, + "38": { + "count": 405 + }, + "57": { + "count": 170 + }, + "66": { + "count": 768 + }, + "0": { + "count": 25 + }, + "1": { + "count": 770 + }, + "2": { + "count": 12 + }, + "3": { + "count": 12 + }, + "5": { + "count": 17 + }, + "6": { + "count": 24 + }, + "7": { + "count": 16 + }, + "8": { + "count": 3 + }, + "9": { + "count": 98 + }, + "10": { + "count": 68 + }, + "11": { + "count": 13 + }, + "12": { + "count": 55 + }, + "13": { + "count": 61 + }, + "14": { + "count": 20 + }, + "15": { + "count": 13 + }, + "16": { + "count": 93 + }, + "17": { + "count": 17 + }, + "18": { + "count": 29 + }, + "19": { + "count": 32 + }, + "20": { + "count": 77 + }, + "22": { + "count": 39 + }, + "23": { + "count": 43 + }, + "24": { + "count": 40 + }, + "25": { + "count": 20 + }, + "26": { + "count": 21 + }, + "27": { + "count": 27 + }, + "28": { + "count": 37 + }, + "29": { + "count": 22 + }, + "30": { + "count": 35 + }, + "31": { + "count": 38 + }, + "32": { + "count": 45 + }, + "33": { + "count": 34 + }, + "34": { + "count": 23 + }, + "35": { + "count": 34 + }, + "36": { + "count": 55 + }, + "39": { + "count": 37 + }, + "40": { + "count": 37 + }, + "41": { + "count": 15 + }, + "42": { + "count": 4 + }, + "43": { + "count": 4 + }, + "44": { + "count": 21 + }, + "45": { + "count": 69 + }, + "46": { + "count": 70 + }, + "47": { + "count": 12 + }, + "48": { + "count": 24 + }, + "49": { + "count": 58 + }, + "50": { + "count": 50 + }, + "51": { + "count": 1 + }, + "52": { + "count": 34 + }, + "53": { + "count": 56 + }, + "54": { + "count": 84 + }, + "55": { + "count": 31 + }, + "56": { + "count": 51 + }, + "58": { + "count": 48 + }, + "59": { + "count": 11 + }, + "60": { + "count": 36 + }, + "61": { + "count": 13 + }, + "62": { + "count": 10 + }, + "63": { + "count": 57 + }, + "64": { + "count": 2 + }, + "65": { + "count": 46 + }, + "67": { + "count": 25 + }, + "68": { + "count": 5 + }, + "69": { + "count": 9 + }, + "70": { + "count": 17 + }, + "71": { + "count": 8 + }, + "72": { + "count": 15 + }, + "73": { + "count": 23 + }, + "74": { + "count": 4 + }, + "75": { + "count": 27 + }, + "76": { + "count": 52 + }, + "77": { + "count": 29 + }, + "78": { + "count": 19 + }, + "79": { + "count": 10 + }, + "80": { + "count": 33 + }, + "81": { + "count": 9 + }, + "82": { + "count": 54 + }, + "83": { + "count": 27 + }, + "84": { + "count": 5 + }, + "85": { + "count": 34 + }, + "86": { + "count": 15 + }, + "87": { + "count": 56 + }, + "88": { + "count": 29 + }, + "89": { + "count": 34 + }, + "90": { + "count": 5 + }, + "91": { + "count": 55 + }, + "92": { + "count": 19 + }, + "93": { + "count": 56 + }, + "94": { + "count": 45 + }, + "95": { + "count": 209 + }, + "96": { + "count": 7 + }, + "97": { + "count": 29 + }, + "98": { + "count": 4 + }, + "99": { + "count": 26 + }, + "100": { + "count": 9 + }, + "101": { + "count": 30 + }, + "21": { + "count": 17 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/Country211.json b/mteb/descriptive_stats/Image/ImageClassification/Country211.json new file mode 100644 index 0000000000..647aefea10 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/Country211.json @@ -0,0 +1,647 @@ +{ + "test": { + "num_samples": 21100, + "unique_num_labels": 211, + "min_image_width": 32, + "average_image_width": 468.5923222748815, + "max_image_width": 500, + "min_image_height": 37, + "average_image_height": 381.726682464455, + "max_image_height": 500, + "labels": { + "0": { + "count": 100 + }, + "1": { + "count": 100 + }, + "2": { + "count": 100 + }, + "3": { + "count": 100 + }, + "4": { + "count": 100 + }, + "5": { + "count": 100 + }, + "6": { + "count": 100 + }, + "7": { + "count": 100 + }, + "8": { + "count": 100 + }, + "9": { + "count": 100 + }, + "10": { + "count": 100 + }, + "11": { + "count": 100 + }, + "12": { + "count": 100 + }, + "13": { + "count": 100 + }, + "14": { + "count": 100 + }, + "15": { + "count": 100 + }, + "16": { + "count": 100 + }, + "17": { + "count": 100 + }, + "18": { + "count": 100 + }, + "19": { + "count": 100 + }, + "20": { + "count": 100 + }, + "21": { + "count": 100 + }, + "22": { + "count": 100 + }, + "23": { + "count": 100 + }, + "24": { + "count": 100 + }, + "25": { + "count": 100 + }, + "26": { + "count": 100 + }, + "27": { + "count": 100 + }, + "28": { + "count": 100 + }, + "29": { + "count": 100 + }, + "30": { + "count": 100 + }, + "31": { + "count": 100 + }, + "32": { + "count": 100 + }, + "33": { + "count": 100 + }, + "34": { + "count": 100 + }, + "35": { + "count": 100 + }, + "36": { + "count": 100 + }, + "37": { + "count": 100 + }, + "38": { + "count": 100 + }, + "39": { + "count": 100 + }, + "40": { + "count": 100 + }, + "41": { + "count": 100 + }, + "42": { + "count": 100 + }, + "43": { + "count": 100 + }, + "44": { + "count": 100 + }, + "45": { + "count": 100 + }, + "46": { + "count": 100 + }, + "47": { + "count": 100 + }, + "48": { + "count": 100 + }, + "49": { + "count": 100 + }, + "50": { + "count": 100 + }, + "51": { + "count": 100 + }, + "52": { + "count": 100 + }, + "53": { + "count": 100 + }, + "54": { + "count": 100 + }, + "55": { + "count": 100 + }, + "56": { + "count": 100 + }, + "57": { + "count": 100 + }, + "58": { + "count": 100 + }, + "59": { + "count": 100 + }, + "60": { + "count": 100 + }, + "61": { + "count": 100 + }, + "62": { + "count": 100 + }, + "63": { + "count": 100 + }, + "64": { + "count": 100 + }, + "65": { + "count": 100 + }, + "66": { + "count": 100 + }, + "67": { + "count": 100 + }, + "68": { + "count": 100 + }, + "69": { + "count": 100 + }, + "70": { + "count": 100 + }, + "71": { + "count": 100 + }, + "72": { + "count": 100 + }, + "73": { + "count": 100 + }, + "74": { + "count": 100 + }, + "75": { + "count": 100 + }, + "76": { + "count": 100 + }, + "77": { + "count": 100 + }, + "78": { + "count": 100 + }, + "79": { + "count": 100 + }, + "80": { + "count": 100 + }, + "81": { + "count": 100 + }, + "82": { + "count": 100 + }, + "83": { + "count": 100 + }, + "84": { + "count": 100 + }, + "85": { + "count": 100 + }, + "86": { + "count": 100 + }, + "87": { + "count": 100 + }, + "88": { + "count": 100 + }, + "89": { + "count": 100 + }, + "90": { + "count": 100 + }, + "91": { + "count": 100 + }, + "92": { + "count": 100 + }, + "93": { + "count": 100 + }, + "94": { + "count": 100 + }, + "95": { + "count": 100 + }, + "96": { + "count": 100 + }, + "97": { + "count": 100 + }, + "98": { + "count": 100 + }, + "99": { + "count": 100 + }, + "100": { + "count": 100 + }, + "101": { + "count": 100 + }, + "102": { + "count": 100 + }, + "103": { + "count": 100 + }, + "104": { + "count": 100 + }, + "105": { + "count": 100 + }, + "106": { + "count": 100 + }, + "107": { + "count": 100 + }, + "108": { + "count": 100 + }, + "109": { + "count": 100 + }, + "110": { + "count": 100 + }, + "111": { + "count": 100 + }, + "112": { + "count": 100 + }, + "113": { + "count": 100 + }, + "114": { + "count": 100 + }, + "115": { + "count": 100 + }, + "116": { + "count": 100 + }, + "117": { + "count": 100 + }, + "118": { + "count": 100 + }, + "119": { + "count": 100 + }, + "120": { + "count": 100 + }, + "121": { + "count": 100 + }, + "122": { + "count": 100 + }, + "123": { + "count": 100 + }, + "124": { + "count": 100 + }, + "125": { + "count": 100 + }, + "126": { + "count": 100 + }, + "127": { + "count": 100 + }, + "128": { + "count": 100 + }, + "129": { + "count": 100 + }, + "130": { + "count": 100 + }, + "131": { + "count": 100 + }, + "132": { + "count": 100 + }, + "133": { + "count": 100 + }, + "134": { + "count": 100 + }, + "135": { + "count": 100 + }, + "136": { + "count": 100 + }, + "137": { + "count": 100 + }, + "138": { + "count": 100 + }, + "139": { + "count": 100 + }, + "140": { + "count": 100 + }, + "141": { + "count": 100 + }, + "142": { + "count": 100 + }, + "143": { + "count": 100 + }, + "144": { + "count": 100 + }, + "145": { + "count": 100 + }, + "146": { + "count": 100 + }, + "147": { + "count": 100 + }, + "148": { + "count": 100 + }, + "149": { + "count": 100 + }, + "150": { + "count": 100 + }, + "151": { + "count": 100 + }, + "152": { + "count": 100 + }, + "153": { + "count": 100 + }, + "154": { + "count": 100 + }, + "155": { + "count": 100 + }, + "156": { + "count": 100 + }, + "157": { + "count": 100 + }, + "158": { + "count": 100 + }, + "159": { + "count": 100 + }, + "160": { + "count": 100 + }, + "161": { + "count": 100 + }, + "162": { + "count": 100 + }, + "163": { + "count": 100 + }, + "164": { + "count": 100 + }, + "165": { + "count": 100 + }, + "166": { + "count": 100 + }, + "167": { + "count": 100 + }, + "168": { + "count": 100 + }, + "169": { + "count": 100 + }, + "170": { + "count": 100 + }, + "171": { + "count": 100 + }, + "172": { + "count": 100 + }, + "173": { + "count": 100 + }, + "174": { + "count": 100 + }, + "175": { + "count": 100 + }, + "176": { + "count": 100 + }, + "177": { + "count": 100 + }, + "178": { + "count": 100 + }, + "179": { + "count": 100 + }, + "180": { + "count": 100 + }, + "181": { + "count": 100 + }, + "182": { + "count": 100 + }, + "183": { + "count": 100 + }, + "184": { + "count": 100 + }, + "185": { + "count": 100 + }, + "186": { + "count": 100 + }, + "187": { + "count": 100 + }, + "188": { + "count": 100 + }, + "189": { + "count": 100 + }, + "190": { + "count": 100 + }, + "191": { + "count": 100 + }, + "192": { + "count": 100 + }, + "193": { + "count": 100 + }, + "194": { + "count": 100 + }, + "195": { + "count": 100 + }, + "196": { + "count": 100 + }, + "197": { + "count": 100 + }, + "198": { + "count": 100 + }, + "199": { + "count": 100 + }, + "200": { + "count": 100 + }, + "201": { + "count": 100 + }, + "202": { + "count": 100 + }, + "203": { + "count": 100 + }, + "204": { + "count": 100 + }, + "205": { + "count": 100 + }, + "206": { + "count": 100 + }, + "207": { + "count": 100 + }, + "208": { + "count": 100 + }, + "209": { + "count": 100 + }, + "210": { + "count": 100 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/DTD.json b/mteb/descriptive_stats/Image/ImageClassification/DTD.json new file mode 100644 index 0000000000..13a6fcf10c --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/DTD.json @@ -0,0 +1,155 @@ +{ + "test": { + "num_samples": 1880, + "unique_num_labels": 47, + "min_image_width": 300, + "average_image_width": 488.9760638297872, + "max_image_width": 900, + "min_image_height": 300, + "average_image_height": 447.4962765957447, + "max_image_height": 778, + "labels": { + "0": { + "count": 40 + }, + "1": { + "count": 40 + }, + "10": { + "count": 40 + }, + "11": { + "count": 40 + }, + "12": { + "count": 40 + }, + "13": { + "count": 40 + }, + "14": { + "count": 40 + }, + "15": { + "count": 40 + }, + "16": { + "count": 40 + }, + "17": { + "count": 40 + }, + "18": { + "count": 40 + }, + "19": { + "count": 40 + }, + "2": { + "count": 40 + }, + "20": { + "count": 40 + }, + "21": { + "count": 40 + }, + "22": { + "count": 40 + }, + "23": { + "count": 40 + }, + "24": { + "count": 40 + }, + "25": { + "count": 40 + }, + "26": { + "count": 40 + }, + "27": { + "count": 40 + }, + "28": { + "count": 40 + }, + "29": { + "count": 40 + }, + "3": { + "count": 40 + }, + "30": { + "count": 40 + }, + "31": { + "count": 40 + }, + "32": { + "count": 40 + }, + "33": { + "count": 40 + }, + "34": { + "count": 40 + }, + "35": { + "count": 40 + }, + "36": { + "count": 40 + }, + "37": { + "count": 40 + }, + "38": { + "count": 40 + }, + "39": { + "count": 40 + }, + "4": { + "count": 40 + }, + "40": { + "count": 40 + }, + "41": { + "count": 40 + }, + "42": { + "count": 40 + }, + "43": { + "count": 40 + }, + "44": { + "count": 40 + }, + "45": { + "count": 40 + }, + "46": { + "count": 40 + }, + "5": { + "count": 40 + }, + "6": { + "count": 40 + }, + "7": { + "count": 40 + }, + "8": { + "count": 40 + }, + "9": { + "count": 40 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/EuroSAT.json b/mteb/descriptive_stats/Image/ImageClassification/EuroSAT.json new file mode 100644 index 0000000000..45464c8286 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/EuroSAT.json @@ -0,0 +1,44 @@ +{ + "test": { + "num_samples": 5400, + "unique_num_labels": 10, + "min_image_width": 64, + "average_image_width": 64.0, + "max_image_width": 64, + "min_image_height": 64, + "average_image_height": 64.0, + "max_image_height": 64, + "labels": { + "4": { + "count": 501 + }, + "3": { + "count": 496 + }, + "7": { + "count": 554 + }, + "2": { + "count": 573 + }, + "9": { + "count": 609 + }, + "0": { + "count": 596 + }, + "8": { + "count": 529 + }, + "1": { + "count": 608 + }, + "5": { + "count": 396 + }, + "6": { + "count": 538 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/FER2013.json b/mteb/descriptive_stats/Image/ImageClassification/FER2013.json new file mode 100644 index 0000000000..a7238cb1a5 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/FER2013.json @@ -0,0 +1,35 @@ +{ + "test": { + "num_samples": 7178, + "unique_num_labels": 7, + "min_image_width": 48, + "average_image_width": 48.0, + "max_image_width": 48, + "min_image_height": 48, + "average_image_height": 48.0, + "max_image_height": 48, + "labels": { + "0": { + "count": 958 + }, + "1": { + "count": 111 + }, + "2": { + "count": 1024 + }, + "3": { + "count": 1774 + }, + "4": { + "count": 1233 + }, + "5": { + "count": 1247 + }, + "6": { + "count": 831 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/FGVCAircraft.json b/mteb/descriptive_stats/Image/ImageClassification/FGVCAircraft.json new file mode 100644 index 0000000000..2b9f2d88b6 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/FGVCAircraft.json @@ -0,0 +1,314 @@ +{ + "test": { + "num_samples": 3333, + "unique_num_labels": 100, + "min_image_width": 800, + "average_image_width": 1098.5760576057605, + "max_image_width": 1600, + "min_image_height": 413, + "average_image_height": 746.996699669967, + "max_image_height": 1197, + "labels": { + "0": { + "count": 33 + }, + "1": { + "count": 33 + }, + "2": { + "count": 34 + }, + "3": { + "count": 33 + }, + "4": { + "count": 33 + }, + "5": { + "count": 34 + }, + "6": { + "count": 33 + }, + "7": { + "count": 33 + }, + "8": { + "count": 34 + }, + "9": { + "count": 33 + }, + "10": { + "count": 33 + }, + "11": { + "count": 34 + }, + "12": { + "count": 33 + }, + "13": { + "count": 33 + }, + "14": { + "count": 34 + }, + "15": { + "count": 33 + }, + "16": { + "count": 33 + }, + "17": { + "count": 34 + }, + "18": { + "count": 33 + }, + "19": { + "count": 33 + }, + "20": { + "count": 34 + }, + "21": { + "count": 33 + }, + "22": { + "count": 33 + }, + "23": { + "count": 34 + }, + "24": { + "count": 33 + }, + "25": { + "count": 33 + }, + "26": { + "count": 34 + }, + "27": { + "count": 33 + }, + "28": { + "count": 33 + }, + "29": { + "count": 34 + }, + "30": { + "count": 33 + }, + "31": { + "count": 33 + }, + "32": { + "count": 34 + }, + "33": { + "count": 33 + }, + "34": { + "count": 33 + }, + "35": { + "count": 34 + }, + "36": { + "count": 33 + }, + "37": { + "count": 33 + }, + "38": { + "count": 34 + }, + "39": { + "count": 33 + }, + "40": { + "count": 33 + }, + "41": { + "count": 34 + }, + "42": { + "count": 33 + }, + "43": { + "count": 33 + }, + "44": { + "count": 34 + }, + "45": { + "count": 33 + }, + "46": { + "count": 33 + }, + "47": { + "count": 34 + }, + "48": { + "count": 33 + }, + "49": { + "count": 33 + }, + "50": { + "count": 34 + }, + "51": { + "count": 33 + }, + "52": { + "count": 33 + }, + "53": { + "count": 34 + }, + "54": { + "count": 33 + }, + "55": { + "count": 33 + }, + "56": { + "count": 34 + }, + "57": { + "count": 33 + }, + "58": { + "count": 33 + }, + "59": { + "count": 34 + }, + "60": { + "count": 33 + }, + "61": { + "count": 33 + }, + "62": { + "count": 34 + }, + "63": { + "count": 33 + }, + "64": { + "count": 33 + }, + "65": { + "count": 34 + }, + "66": { + "count": 33 + }, + "67": { + "count": 33 + }, + "68": { + "count": 34 + }, + "69": { + "count": 33 + }, + "70": { + "count": 33 + }, + "71": { + "count": 34 + }, + "72": { + "count": 33 + }, + "73": { + "count": 33 + }, + "74": { + "count": 34 + }, + "75": { + "count": 33 + }, + "76": { + "count": 33 + }, + "77": { + "count": 34 + }, + "78": { + "count": 33 + }, + "79": { + "count": 33 + }, + "80": { + "count": 34 + }, + "81": { + "count": 33 + }, + "82": { + "count": 33 + }, + "83": { + "count": 34 + }, + "84": { + "count": 33 + }, + "85": { + "count": 33 + }, + "86": { + "count": 34 + }, + "87": { + "count": 33 + }, + "88": { + "count": 33 + }, + "89": { + "count": 34 + }, + "90": { + "count": 33 + }, + "91": { + "count": 33 + }, + "92": { + "count": 34 + }, + "93": { + "count": 33 + }, + "94": { + "count": 33 + }, + "95": { + "count": 34 + }, + "96": { + "count": 33 + }, + "97": { + "count": 33 + }, + "98": { + "count": 34 + }, + "99": { + "count": 33 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/Food101Classification.json b/mteb/descriptive_stats/Image/ImageClassification/Food101Classification.json new file mode 100644 index 0000000000..4137261f84 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/Food101Classification.json @@ -0,0 +1,317 @@ +{ + "validation": { + "num_samples": 25250, + "unique_num_labels": 101, + "min_image_width": 287, + "average_image_width": 495.818495049505, + "max_image_width": 512, + "min_image_height": 213, + "average_image_height": 475.08229702970294, + "max_image_height": 512, + "labels": { + "6": { + "count": 250 + }, + "79": { + "count": 250 + }, + "81": { + "count": 250 + }, + "53": { + "count": 250 + }, + "10": { + "count": 250 + }, + "20": { + "count": 250 + }, + "77": { + "count": 250 + }, + "48": { + "count": 250 + }, + "86": { + "count": 250 + }, + "84": { + "count": 250 + }, + "76": { + "count": 250 + }, + "34": { + "count": 250 + }, + "51": { + "count": 250 + }, + "21": { + "count": 250 + }, + "64": { + "count": 250 + }, + "0": { + "count": 250 + }, + "43": { + "count": 250 + }, + "44": { + "count": 250 + }, + "73": { + "count": 250 + }, + "57": { + "count": 250 + }, + "14": { + "count": 250 + }, + "5": { + "count": 250 + }, + "46": { + "count": 250 + }, + "55": { + "count": 250 + }, + "93": { + "count": 250 + }, + "98": { + "count": 250 + }, + "38": { + "count": 250 + }, + "11": { + "count": 250 + }, + "99": { + "count": 250 + }, + "72": { + "count": 250 + }, + "22": { + "count": 250 + }, + "59": { + "count": 250 + }, + "70": { + "count": 250 + }, + "16": { + "count": 250 + }, + "2": { + "count": 250 + }, + "58": { + "count": 250 + }, + "83": { + "count": 250 + }, + "96": { + "count": 250 + }, + "39": { + "count": 250 + }, + "49": { + "count": 250 + }, + "45": { + "count": 250 + }, + "88": { + "count": 250 + }, + "9": { + "count": 250 + }, + "26": { + "count": 250 + }, + "94": { + "count": 250 + }, + "4": { + "count": 250 + }, + "65": { + "count": 250 + }, + "32": { + "count": 250 + }, + "27": { + "count": 250 + }, + "36": { + "count": 250 + }, + "87": { + "count": 250 + }, + "69": { + "count": 250 + }, + "85": { + "count": 250 + }, + "25": { + "count": 250 + }, + "40": { + "count": 250 + }, + "19": { + "count": 250 + }, + "35": { + "count": 250 + }, + "56": { + "count": 250 + }, + "42": { + "count": 250 + }, + "60": { + "count": 250 + }, + "68": { + "count": 250 + }, + "100": { + "count": 250 + }, + "41": { + "count": 250 + }, + "92": { + "count": 250 + }, + "24": { + "count": 250 + }, + "3": { + "count": 250 + }, + "89": { + "count": 250 + }, + "75": { + "count": 250 + }, + "17": { + "count": 250 + }, + "97": { + "count": 250 + }, + "61": { + "count": 250 + }, + "33": { + "count": 250 + }, + "80": { + "count": 250 + }, + "30": { + "count": 250 + }, + "8": { + "count": 250 + }, + "74": { + "count": 250 + }, + "66": { + "count": 250 + }, + "31": { + "count": 250 + }, + "18": { + "count": 250 + }, + "67": { + "count": 250 + }, + "37": { + "count": 250 + }, + "13": { + "count": 250 + }, + "63": { + "count": 250 + }, + "28": { + "count": 250 + }, + "47": { + "count": 250 + }, + "52": { + "count": 250 + }, + "54": { + "count": 250 + }, + "1": { + "count": 250 + }, + "82": { + "count": 250 + }, + "91": { + "count": 250 + }, + "95": { + "count": 250 + }, + "7": { + "count": 250 + }, + "29": { + "count": 250 + }, + "78": { + "count": 250 + }, + "15": { + "count": 250 + }, + "23": { + "count": 250 + }, + "12": { + "count": 250 + }, + "62": { + "count": 250 + }, + "50": { + "count": 250 + }, + "71": { + "count": 250 + }, + "90": { + "count": 250 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/GTSRB.json b/mteb/descriptive_stats/Image/ImageClassification/GTSRB.json new file mode 100644 index 0000000000..84a5216450 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/GTSRB.json @@ -0,0 +1,143 @@ +{ + "test": { + "num_samples": 12630, + "unique_num_labels": 43, + "min_image_width": 25, + "average_image_width": 50.50775930324624, + "max_image_width": 266, + "min_image_height": 25, + "average_image_height": 50.36444972288203, + "max_image_height": 232, + "labels": { + "16": { + "count": 150 + }, + "1": { + "count": 720 + }, + "38": { + "count": 690 + }, + "33": { + "count": 210 + }, + "11": { + "count": 420 + }, + "18": { + "count": 390 + }, + "12": { + "count": 690 + }, + "25": { + "count": 480 + }, + "35": { + "count": 390 + }, + "7": { + "count": 450 + }, + "23": { + "count": 150 + }, + "4": { + "count": 660 + }, + "9": { + "count": 480 + }, + "21": { + "count": 90 + }, + "20": { + "count": 90 + }, + "27": { + "count": 60 + }, + "3": { + "count": 450 + }, + "13": { + "count": 720 + }, + "10": { + "count": 660 + }, + "5": { + "count": 630 + }, + "17": { + "count": 360 + }, + "34": { + "count": 120 + }, + "2": { + "count": 750 + }, + "8": { + "count": 450 + }, + "30": { + "count": 150 + }, + "24": { + "count": 90 + }, + "15": { + "count": 210 + }, + "26": { + "count": 180 + }, + "28": { + "count": 150 + }, + "22": { + "count": 120 + }, + "14": { + "count": 270 + }, + "32": { + "count": 60 + }, + "29": { + "count": 90 + }, + "6": { + "count": 150 + }, + "36": { + "count": 120 + }, + "40": { + "count": 90 + }, + "41": { + "count": 60 + }, + "31": { + "count": 270 + }, + "19": { + "count": 60 + }, + "0": { + "count": 60 + }, + "39": { + "count": 90 + }, + "42": { + "count": 90 + }, + "37": { + "count": 60 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/OxfordFlowersClassification.json b/mteb/descriptive_stats/Image/ImageClassification/OxfordFlowersClassification.json new file mode 100644 index 0000000000..852aadc78b --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/OxfordFlowersClassification.json @@ -0,0 +1,320 @@ +{ + "test": { + "num_samples": 1020, + "unique_num_labels": 102, + "min_image_width": 500, + "average_image_width": 618.0725490196079, + "max_image_width": 873, + "min_image_height": 500, + "average_image_height": 538.2607843137255, + "max_image_height": 928, + "labels": { + "0": { + "count": 9 + }, + "1": { + "count": 9 + }, + "2": { + "count": 10 + }, + "3": { + "count": 9 + }, + "4": { + "count": 11 + }, + "5": { + "count": 11 + }, + "6": { + "count": 10 + }, + "7": { + "count": 10 + }, + "8": { + "count": 11 + }, + "9": { + "count": 10 + }, + "10": { + "count": 10 + }, + "11": { + "count": 9 + }, + "12": { + "count": 10 + }, + "13": { + "count": 10 + }, + "14": { + "count": 10 + }, + "15": { + "count": 9 + }, + "16": { + "count": 11 + }, + "17": { + "count": 11 + }, + "18": { + "count": 10 + }, + "19": { + "count": 9 + }, + "20": { + "count": 9 + }, + "21": { + "count": 10 + }, + "22": { + "count": 11 + }, + "23": { + "count": 11 + }, + "24": { + "count": 10 + }, + "25": { + "count": 11 + }, + "26": { + "count": 10 + }, + "27": { + "count": 9 + }, + "28": { + "count": 11 + }, + "29": { + "count": 10 + }, + "30": { + "count": 10 + }, + "31": { + "count": 9 + }, + "32": { + "count": 10 + }, + "33": { + "count": 10 + }, + "34": { + "count": 10 + }, + "35": { + "count": 11 + }, + "36": { + "count": 9 + }, + "37": { + "count": 10 + }, + "38": { + "count": 10 + }, + "39": { + "count": 11 + }, + "40": { + "count": 10 + }, + "41": { + "count": 10 + }, + "42": { + "count": 11 + }, + "43": { + "count": 10 + }, + "44": { + "count": 10 + }, + "45": { + "count": 10 + }, + "46": { + "count": 10 + }, + "47": { + "count": 9 + }, + "48": { + "count": 10 + }, + "49": { + "count": 11 + }, + "50": { + "count": 10 + }, + "51": { + "count": 10 + }, + "52": { + "count": 10 + }, + "53": { + "count": 10 + }, + "54": { + "count": 10 + }, + "55": { + "count": 10 + }, + "56": { + "count": 10 + }, + "57": { + "count": 11 + }, + "58": { + "count": 10 + }, + "59": { + "count": 10 + }, + "60": { + "count": 10 + }, + "61": { + "count": 10 + }, + "62": { + "count": 9 + }, + "63": { + "count": 10 + }, + "64": { + "count": 10 + }, + "65": { + "count": 9 + }, + "66": { + "count": 11 + }, + "67": { + "count": 10 + }, + "68": { + "count": 11 + }, + "69": { + "count": 9 + }, + "70": { + "count": 9 + }, + "71": { + "count": 10 + }, + "72": { + "count": 10 + }, + "73": { + "count": 10 + }, + "74": { + "count": 10 + }, + "75": { + "count": 10 + }, + "76": { + "count": 10 + }, + "77": { + "count": 10 + }, + "78": { + "count": 9 + }, + "79": { + "count": 10 + }, + "80": { + "count": 10 + }, + "81": { + "count": 11 + }, + "82": { + "count": 10 + }, + "83": { + "count": 9 + }, + "84": { + "count": 11 + }, + "85": { + "count": 10 + }, + "86": { + "count": 10 + }, + "87": { + "count": 10 + }, + "88": { + "count": 10 + }, + "89": { + "count": 10 + }, + "90": { + "count": 10 + }, + "91": { + "count": 10 + }, + "92": { + "count": 10 + }, + "93": { + "count": 9 + }, + "94": { + "count": 9 + }, + "95": { + "count": 10 + }, + "96": { + "count": 10 + }, + "97": { + "count": 10 + }, + "98": { + "count": 10 + }, + "99": { + "count": 10 + }, + "100": { + "count": 10 + }, + "101": { + "count": 11 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/OxfordPets.json b/mteb/descriptive_stats/Image/ImageClassification/OxfordPets.json new file mode 100644 index 0000000000..0aa19204a7 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/OxfordPets.json @@ -0,0 +1,125 @@ +{ + "test": { + "num_samples": 3669, + "unique_num_labels": 37, + "min_image_width": 137, + "average_image_width": 443.4600708639956, + "max_image_width": 1646, + "min_image_height": 103, + "average_image_height": 399.3780321613519, + "max_image_height": 2160, + "labels": { + "0": { + "count": 98 + }, + "1": { + "count": 100 + }, + "2": { + "count": 100 + }, + "3": { + "count": 100 + }, + "4": { + "count": 100 + }, + "5": { + "count": 100 + }, + "6": { + "count": 100 + }, + "7": { + "count": 88 + }, + "8": { + "count": 99 + }, + "9": { + "count": 100 + }, + "10": { + "count": 100 + }, + "11": { + "count": 97 + }, + "12": { + "count": 100 + }, + "13": { + "count": 100 + }, + "14": { + "count": 100 + }, + "15": { + "count": 100 + }, + "16": { + "count": 100 + }, + "17": { + "count": 100 + }, + "18": { + "count": 99 + }, + "19": { + "count": 100 + }, + "20": { + "count": 100 + }, + "21": { + "count": 100 + }, + "22": { + "count": 100 + }, + "23": { + "count": 100 + }, + "24": { + "count": 100 + }, + "25": { + "count": 100 + }, + "26": { + "count": 100 + }, + "27": { + "count": 100 + }, + "28": { + "count": 100 + }, + "29": { + "count": 100 + }, + "30": { + "count": 99 + }, + "31": { + "count": 100 + }, + "32": { + "count": 100 + }, + "33": { + "count": 100 + }, + "34": { + "count": 89 + }, + "35": { + "count": 100 + }, + "36": { + "count": 100 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/PatchCamelyon.json b/mteb/descriptive_stats/Image/ImageClassification/PatchCamelyon.json new file mode 100644 index 0000000000..e6b13afe50 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/PatchCamelyon.json @@ -0,0 +1,20 @@ +{ + "test": { + "num_samples": 32768, + "unique_num_labels": 2, + "min_image_width": 96, + "average_image_width": 96.0, + "max_image_width": 96, + "min_image_height": 96, + "average_image_height": 96.0, + "max_image_height": 96, + "labels": { + "0": { + "count": 16391 + }, + "1": { + "count": 16377 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/RESISC45.json b/mteb/descriptive_stats/Image/ImageClassification/RESISC45.json new file mode 100644 index 0000000000..f4a2290189 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/RESISC45.json @@ -0,0 +1,149 @@ +{ + "test": { + "num_samples": 6300, + "unique_num_labels": 45, + "min_image_width": 256, + "average_image_width": 256.0, + "max_image_width": 256, + "min_image_height": 256, + "average_image_height": 256.0, + "max_image_height": 256, + "labels": { + "31": { + "count": 135 + }, + "11": { + "count": 144 + }, + "28": { + "count": 135 + }, + "43": { + "count": 154 + }, + "41": { + "count": 144 + }, + "33": { + "count": 134 + }, + "19": { + "count": 130 + }, + "16": { + "count": 127 + }, + "22": { + "count": 130 + }, + "34": { + "count": 143 + }, + "24": { + "count": 164 + }, + "0": { + "count": 169 + }, + "13": { + "count": 146 + }, + "25": { + "count": 115 + }, + "6": { + "count": 132 + }, + "36": { + "count": 135 + }, + "39": { + "count": 142 + }, + "18": { + "count": 140 + }, + "23": { + "count": 147 + }, + "37": { + "count": 159 + }, + "15": { + "count": 122 + }, + "29": { + "count": 140 + }, + "9": { + "count": 159 + }, + "27": { + "count": 140 + }, + "21": { + "count": 131 + }, + "3": { + "count": 134 + }, + "1": { + "count": 162 + }, + "32": { + "count": 153 + }, + "26": { + "count": 150 + }, + "35": { + "count": 151 + }, + "44": { + "count": 118 + }, + "30": { + "count": 154 + }, + "20": { + "count": 139 + }, + "4": { + "count": 130 + }, + "42": { + "count": 127 + }, + "40": { + "count": 137 + }, + "5": { + "count": 140 + }, + "17": { + "count": 142 + }, + "2": { + "count": 123 + }, + "38": { + "count": 130 + }, + "10": { + "count": 140 + }, + "12": { + "count": 146 + }, + "8": { + "count": 146 + }, + "7": { + "count": 143 + }, + "14": { + "count": 118 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/STL10.json b/mteb/descriptive_stats/Image/ImageClassification/STL10.json new file mode 100644 index 0000000000..a647321290 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/STL10.json @@ -0,0 +1,44 @@ +{ + "test": { + "num_samples": 8000, + "unique_num_labels": 10, + "min_image_width": 96, + "average_image_width": 96.0, + "max_image_width": 96, + "min_image_height": 96, + "average_image_height": 96.0, + "max_image_height": 96, + "labels": { + "0": { + "count": 800 + }, + "1": { + "count": 800 + }, + "2": { + "count": 800 + }, + "3": { + "count": 800 + }, + "4": { + "count": 800 + }, + "5": { + "count": 800 + }, + "6": { + "count": 800 + }, + "7": { + "count": 800 + }, + "8": { + "count": 800 + }, + "9": { + "count": 800 + } + } + } +} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/StanfordCars.json b/mteb/descriptive_stats/Image/ImageClassification/StanfordCars.json new file mode 100644 index 0000000000..b1d5a9afc5 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/StanfordCars.json @@ -0,0 +1,602 @@ +{ + "test": { + "num_samples": 8041, + "unique_num_labels": 196, + "min_image_width": 78, + "average_image_width": 701.1770924014426, + "max_image_width": 7800, + "min_image_height": 41, + "average_image_height": 483.749658002736, + "max_image_height": 5400, + "labels": { + "180": { + "count": 38 + }, + "102": { + "count": 39 + }, + "144": { + "count": 44 + }, + "186": { + "count": 43 + }, + "184": { + "count": 38 + }, + "77": { + "count": 37 + }, + "117": { + "count": 41 + }, + "164": { + "count": 44 + }, + "31": { + "count": 41 + }, + "59": { + "count": 36 + }, + "48": { + "count": 37 + }, + "107": { + "count": 44 + }, + "115": { + "count": 37 + }, + "134": { + "count": 42 + }, + "82": { + "count": 40 + }, + "50": { + "count": 43 + }, + "153": { + "count": 42 + }, + "32": { + "count": 42 + }, + "21": { + "count": 42 + }, + "150": { + "count": 43 + }, + "3": { + "count": 42 + }, + "80": { + "count": 45 + }, + "106": { + "count": 44 + }, + "190": { + "count": 46 + }, + "169": { + "count": 44 + }, + "194": { + "count": 43 + }, + "90": { + "count": 38 + }, + "4": { + "count": 40 + }, + "163": { + "count": 43 + }, + "147": { + "count": 45 + }, + "187": { + "count": 43 + }, + "43": { + "count": 44 + }, + "6": { + "count": 39 + }, + "30": { + "count": 44 + }, + "73": { + "count": 43 + }, + "29": { + "count": 41 + }, + "165": { + "count": 41 + }, + "179": { + "count": 42 + }, + "105": { + "count": 41 + }, + "2": { + "count": 43 + }, + "64": { + "count": 45 + }, + "34": { + "count": 41 + }, + "74": { + "count": 44 + }, + "84": { + "count": 43 + }, + "24": { + "count": 39 + }, + "167": { + "count": 42 + }, + "136": { + "count": 43 + }, + "133": { + "count": 33 + }, + "155": { + "count": 39 + }, + "119": { + "count": 42 + }, + "129": { + "count": 41 + }, + "127": { + "count": 39 + }, + "35": { + "count": 41 + }, + "170": { + "count": 46 + }, + "36": { + "count": 38 + }, + "63": { + "count": 29 + }, + "182": { + "count": 42 + }, + "42": { + "count": 46 + }, + "17": { + "count": 42 + }, + "75": { + "count": 43 + }, + "0": { + "count": 44 + }, + "62": { + "count": 44 + }, + "173": { + "count": 41 + }, + "16": { + "count": 40 + }, + "104": { + "count": 43 + }, + "49": { + "count": 42 + }, + "122": { + "count": 44 + }, + "81": { + "count": 45 + }, + "191": { + "count": 42 + }, + "92": { + "count": 39 + }, + "145": { + "count": 43 + }, + "95": { + "count": 41 + }, + "54": { + "count": 39 + }, + "114": { + "count": 45 + }, + "112": { + "count": 42 + }, + "151": { + "count": 35 + }, + "91": { + "count": 40 + }, + "188": { + "count": 40 + }, + "20": { + "count": 42 + }, + "33": { + "count": 44 + }, + "86": { + "count": 44 + }, + "128": { + "count": 38 + }, + "142": { + "count": 40 + }, + "19": { + "count": 46 + }, + "177": { + "count": 41 + }, + "11": { + "count": 36 + }, + "45": { + "count": 43 + }, + "60": { + "count": 43 + }, + "8": { + "count": 41 + }, + "56": { + "count": 37 + }, + "28": { + "count": 42 + }, + "120": { + "count": 44 + }, + "5": { + "count": 44 + }, + "85": { + "count": 42 + }, + "68": { + "count": 38 + }, + "22": { + "count": 39 + }, + "108": { + "count": 44 + }, + "89": { + "count": 41 + }, + "132": { + "count": 42 + }, + "125": { + "count": 42 + }, + "137": { + "count": 39 + }, + "158": { + "count": 36 + }, + "58": { + "count": 44 + }, + "123": { + "count": 39 + }, + "52": { + "count": 44 + }, + "27": { + "count": 41 + }, + "13": { + "count": 42 + }, + "70": { + "count": 35 + }, + "25": { + "count": 34 + }, + "185": { + "count": 38 + }, + "171": { + "count": 44 + }, + "9": { + "count": 33 + }, + "40": { + "count": 35 + }, + "178": { + "count": 45 + }, + "44": { + "count": 32 + }, + "97": { + "count": 46 + }, + "87": { + "count": 39 + }, + "159": { + "count": 44 + }, + "146": { + "count": 44 + }, + "51": { + "count": 41 + }, + "121": { + "count": 40 + }, + "1": { + "count": 32 + }, + "160": { + "count": 48 + }, + "78": { + "count": 48 + }, + "109": { + "count": 43 + }, + "103": { + "count": 42 + }, + "174": { + "count": 30 + }, + "181": { + "count": 46 + }, + "23": { + "count": 45 + }, + "111": { + "count": 45 + }, + "166": { + "count": 47 + }, + "172": { + "count": 43 + }, + "66": { + "count": 38 + }, + "192": { + "count": 41 + }, + "148": { + "count": 42 + }, + "72": { + "count": 44 + }, + "141": { + "count": 32 + }, + "71": { + "count": 45 + }, + "7": { + "count": 45 + }, + "152": { + "count": 44 + }, + "183": { + "count": 40 + }, + "98": { + "count": 27 + }, + "94": { + "count": 45 + }, + "126": { + "count": 41 + }, + "100": { + "count": 42 + }, + "131": { + "count": 43 + }, + "116": { + "count": 42 + }, + "39": { + "count": 39 + }, + "149": { + "count": 36 + }, + "101": { + "count": 39 + }, + "139": { + "count": 42 + }, + "69": { + "count": 42 + }, + "12": { + "count": 41 + }, + "14": { + "count": 43 + }, + "96": { + "count": 42 + }, + "41": { + "count": 34 + }, + "189": { + "count": 43 + }, + "10": { + "count": 38 + }, + "140": { + "count": 34 + }, + "26": { + "count": 35 + }, + "57": { + "count": 44 + }, + "88": { + "count": 44 + }, + "67": { + "count": 40 + }, + "93": { + "count": 43 + }, + "193": { + "count": 45 + }, + "161": { + "count": 45 + }, + "118": { + "count": 68 + }, + "110": { + "count": 42 + }, + "154": { + "count": 42 + }, + "138": { + "count": 42 + }, + "143": { + "count": 46 + }, + "61": { + "count": 37 + }, + "176": { + "count": 44 + }, + "113": { + "count": 45 + }, + "18": { + "count": 40 + }, + "53": { + "count": 40 + }, + "47": { + "count": 42 + }, + "157": { + "count": 29 + }, + "168": { + "count": 38 + }, + "124": { + "count": 43 + }, + "79": { + "count": 43 + }, + "130": { + "count": 42 + }, + "46": { + "count": 35 + }, + "55": { + "count": 46 + }, + "195": { + "count": 40 + }, + "38": { + "count": 36 + }, + "37": { + "count": 40 + }, + "99": { + "count": 33 + }, + "83": { + "count": 42 + }, + "162": { + "count": 36 + }, + "135": { + "count": 24 + }, + "175": { + "count": 38 + }, + "156": { + "count": 36 + }, + "15": { + "count": 43 + }, + "65": { + "count": 41 + }, + "76": { + "count": 40 + } + } + } +} \ No newline at end of file diff --git a/mteb/encoder_interface.py b/mteb/encoder_interface.py index 5a66330cdc..db43c01521 100644 --- a/mteb/encoder_interface.py +++ b/mteb/encoder_interface.py @@ -1,6 +1,6 @@ from __future__ import annotations -from collections.abc import Sequence +from collections.abc import Iterable, Sequence from enum import Enum from typing import Any, Protocol, Union, runtime_checkable @@ -205,3 +205,47 @@ def get_fused_embeddings( # hmm what if I have a document with images at specif **kwargs: Any, ) -> np.ndarray: pass + + +class MultiModalEncoder: + """Extending the MTEB encoder interface to cover image, audio, and mixed modality cases. + """ + + def __init__(self, device: str | None, **kwargs: Any): + pass + + def encode( + self, + inputs: Iterable[str] # text + | Iterable[Image.Image] # images + | DataLoader #image data loader + | Iterable[tuple[Image.Image, str]] # image and text + | Iterable[tuple[DataLoader, list[str]]] # image dataloader and text + | Iterable[tuple[list[Image.Image], str]] # images and text + + | Iterable[Any], + *, + task_name: str, + prompt_type: PromptType | None = None, + **kwargs: Any, + ) -> np.ndarray: + """The encode method handles all input modalities. + # single modalities + text: Iterable[str] + images: Iterable[Image.Image] + audio: Iterable[audio] + + # current mixed cases from MIEB + image_and_text: Iterable[tuple[Image.Image, str]] + image_dataloader_and_text: Iterable[tuple[DataLoader, list[str]]] + images_and_text: Iterable[tuple[list[Image.Image], str]] + + # potential MAEB mixed case + audio_and_text: Iterable[tuple[audio,text] + + mixed: image_and_text | image_dataloader_and_text | images_and_text | audio_and_text + + # All together + inputs: text | images | audio | mixed + """ + pass diff --git a/mteb/models/lens_models.py b/mteb/models/lens_models.py index 46bc25c3de..c83bf2a3d0 100644 --- a/mteb/models/lens_models.py +++ b/mteb/models/lens_models.py @@ -3,7 +3,6 @@ from mteb.model_meta import ModelMeta from mteb.models.bge_models import bge_full_data - lens_d4000 = ModelMeta( loader=None, # TODO: implement this in the future name="yibinlei/LENS-d4000", From a738590fcc9146c7ed4903bc8b1c68168d940894 Mon Sep 17 00:00:00 2001 From: Isaac Chung Date: Sun, 16 Feb 2025 16:31:36 +0000 Subject: [PATCH 2/3] revert changes to encoder --- mteb/encoder_interface.py | 46 +-------------------------------------- 1 file changed, 1 insertion(+), 45 deletions(-) diff --git a/mteb/encoder_interface.py b/mteb/encoder_interface.py index db43c01521..5a66330cdc 100644 --- a/mteb/encoder_interface.py +++ b/mteb/encoder_interface.py @@ -1,6 +1,6 @@ from __future__ import annotations -from collections.abc import Iterable, Sequence +from collections.abc import Sequence from enum import Enum from typing import Any, Protocol, Union, runtime_checkable @@ -205,47 +205,3 @@ def get_fused_embeddings( # hmm what if I have a document with images at specif **kwargs: Any, ) -> np.ndarray: pass - - -class MultiModalEncoder: - """Extending the MTEB encoder interface to cover image, audio, and mixed modality cases. - """ - - def __init__(self, device: str | None, **kwargs: Any): - pass - - def encode( - self, - inputs: Iterable[str] # text - | Iterable[Image.Image] # images - | DataLoader #image data loader - | Iterable[tuple[Image.Image, str]] # image and text - | Iterable[tuple[DataLoader, list[str]]] # image dataloader and text - | Iterable[tuple[list[Image.Image], str]] # images and text - - | Iterable[Any], - *, - task_name: str, - prompt_type: PromptType | None = None, - **kwargs: Any, - ) -> np.ndarray: - """The encode method handles all input modalities. - # single modalities - text: Iterable[str] - images: Iterable[Image.Image] - audio: Iterable[audio] - - # current mixed cases from MIEB - image_and_text: Iterable[tuple[Image.Image, str]] - image_dataloader_and_text: Iterable[tuple[DataLoader, list[str]]] - images_and_text: Iterable[tuple[list[Image.Image], str]] - - # potential MAEB mixed case - audio_and_text: Iterable[tuple[audio,text] - - mixed: image_and_text | image_dataloader_and_text | images_and_text | audio_and_text - - # All together - inputs: text | images | audio | mixed - """ - pass From 2766d2fb8c7ef9e75e1fde604413c909c3d37fd2 Mon Sep 17 00:00:00 2001 From: Roman Solomatin <36135455+Samoed@users.noreply.github.com> Date: Mon, 17 Feb 2025 01:21:28 +0300 Subject: [PATCH 3/3] add stats --- mteb/descriptive_stats/Image/ImageClassification/Birdsnap.json | 1 + mteb/descriptive_stats/Image/ImageClassification/SUN397.json | 1 + mteb/descriptive_stats/Image/ImageClassification/UCF101.json | 1 + 3 files changed, 3 insertions(+) create mode 100644 mteb/descriptive_stats/Image/ImageClassification/Birdsnap.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/SUN397.json create mode 100644 mteb/descriptive_stats/Image/ImageClassification/UCF101.json diff --git a/mteb/descriptive_stats/Image/ImageClassification/Birdsnap.json b/mteb/descriptive_stats/Image/ImageClassification/Birdsnap.json new file mode 100644 index 0000000000..83d7d504c2 --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/Birdsnap.json @@ -0,0 +1 @@ +{"test": {"num_samples": 1851, "unique_num_labels": 490, "min_image_width": 267, "average_image_width": 2081.5569962182603, "max_image_width": 6400, "min_image_height": 200, "average_image_height": 1609.192868719611, "max_image_height": 5400, "labels": {"0": {"count": 4}, "1": {"count": 5}, "2": {"count": 4}, "3": {"count": 4}, "4": {"count": 4}, "5": {"count": 2}, "6": {"count": 3}, "7": {"count": 5}, "8": {"count": 4}, "9": {"count": 5}, "11": {"count": 3}, "12": {"count": 4}, "13": {"count": 5}, "14": {"count": 4}, "15": {"count": 5}, "16": {"count": 4}, "17": {"count": 3}, "18": {"count": 2}, "19": {"count": 5}, "20": {"count": 4}, "21": {"count": 4}, "22": {"count": 5}, "23": {"count": 2}, "24": {"count": 4}, "25": {"count": 3}, "26": {"count": 4}, "27": {"count": 4}, "28": {"count": 2}, "29": {"count": 5}, "30": {"count": 3}, "31": {"count": 3}, "32": {"count": 3}, "33": {"count": 4}, "34": {"count": 4}, "35": {"count": 4}, "36": {"count": 3}, "37": {"count": 3}, "38": {"count": 4}, "39": {"count": 3}, "40": {"count": 4}, "41": {"count": 3}, "42": {"count": 3}, "43": {"count": 4}, "44": {"count": 2}, "45": {"count": 3}, "47": {"count": 5}, "48": {"count": 2}, "49": {"count": 5}, "50": {"count": 4}, "51": {"count": 5}, "52": {"count": 3}, "53": {"count": 3}, "54": {"count": 4}, "55": {"count": 2}, "56": {"count": 2}, "57": {"count": 5}, "58": {"count": 2}, "59": {"count": 1}, "60": {"count": 1}, "61": {"count": 3}, "62": {"count": 3}, "63": {"count": 5}, "64": {"count": 5}, "65": {"count": 4}, "67": {"count": 2}, "68": {"count": 3}, "69": {"count": 4}, "70": {"count": 5}, "71": {"count": 5}, "72": {"count": 5}, "73": {"count": 4}, "74": {"count": 5}, "75": {"count": 4}, "76": {"count": 4}, "80": {"count": 3}, "81": {"count": 5}, "82": {"count": 3}, "83": {"count": 5}, "84": {"count": 3}, "85": {"count": 4}, "86": {"count": 4}, "87": {"count": 5}, "88": {"count": 4}, "89": {"count": 5}, "90": {"count": 4}, "91": {"count": 4}, "92": {"count": 5}, "93": {"count": 4}, "94": {"count": 4}, "95": {"count": 5}, "96": {"count": 5}, "97": {"count": 5}, "98": {"count": 3}, "99": {"count": 5}, "100": {"count": 4}, "101": {"count": 5}, "102": {"count": 4}, "103": {"count": 3}, "105": {"count": 4}, "108": {"count": 4}, "109": {"count": 5}, "110": {"count": 3}, "111": {"count": 3}, "112": {"count": 4}, "113": {"count": 4}, "114": {"count": 5}, "115": {"count": 4}, "116": {"count": 5}, "117": {"count": 4}, "118": {"count": 4}, "119": {"count": 5}, "120": {"count": 5}, "121": {"count": 4}, "122": {"count": 3}, "124": {"count": 3}, "125": {"count": 4}, "126": {"count": 2}, "127": {"count": 3}, "128": {"count": 5}, "129": {"count": 5}, "130": {"count": 5}, "131": {"count": 3}, "132": {"count": 4}, "133": {"count": 4}, "134": {"count": 2}, "135": {"count": 5}, "136": {"count": 5}, "137": {"count": 3}, "138": {"count": 4}, "139": {"count": 3}, "140": {"count": 3}, "141": {"count": 2}, "142": {"count": 3}, "143": {"count": 5}, "144": {"count": 4}, "145": {"count": 5}, "146": {"count": 5}, "147": {"count": 5}, "148": {"count": 4}, "149": {"count": 4}, "150": {"count": 5}, "151": {"count": 5}, "152": {"count": 5}, "153": {"count": 3}, "154": {"count": 4}, "155": {"count": 3}, "156": {"count": 3}, "157": {"count": 3}, "159": {"count": 3}, "160": {"count": 4}, "161": {"count": 4}, "162": {"count": 4}, "163": {"count": 4}, "164": {"count": 3}, "165": {"count": 3}, "166": {"count": 3}, "167": {"count": 4}, "168": {"count": 4}, "169": {"count": 4}, "170": {"count": 4}, "171": {"count": 5}, "172": {"count": 4}, "173": {"count": 4}, "174": {"count": 5}, "175": {"count": 4}, "176": {"count": 2}, "177": {"count": 5}, "178": {"count": 5}, "179": {"count": 5}, "180": {"count": 5}, "181": {"count": 4}, "183": {"count": 2}, "184": {"count": 3}, "185": {"count": 2}, "186": {"count": 5}, "187": {"count": 2}, "188": {"count": 3}, "189": {"count": 2}, "190": {"count": 5}, "191": {"count": 4}, "192": {"count": 3}, "193": {"count": 3}, "194": {"count": 4}, "195": {"count": 3}, "196": {"count": 4}, "197": {"count": 3}, "198": {"count": 4}, "199": {"count": 5}, "200": {"count": 5}, "201": {"count": 1}, "204": {"count": 4}, "205": {"count": 5}, "206": {"count": 4}, "207": {"count": 3}, "208": {"count": 4}, "209": {"count": 4}, "210": {"count": 4}, "211": {"count": 4}, "212": {"count": 5}, "213": {"count": 4}, "214": {"count": 5}, "215": {"count": 3}, "216": {"count": 1}, "217": {"count": 5}, "218": {"count": 2}, "219": {"count": 5}, "220": {"count": 4}, "221": {"count": 5}, "222": {"count": 5}, "223": {"count": 3}, "224": {"count": 4}, "225": {"count": 5}, "226": {"count": 3}, "227": {"count": 4}, "228": {"count": 3}, "229": {"count": 4}, "230": {"count": 4}, "231": {"count": 5}, "232": {"count": 5}, "233": {"count": 5}, "234": {"count": 4}, "235": {"count": 4}, "236": {"count": 5}, "237": {"count": 5}, "238": {"count": 5}, "239": {"count": 4}, "240": {"count": 3}, "241": {"count": 3}, "242": {"count": 4}, "243": {"count": 5}, "244": {"count": 2}, "245": {"count": 4}, "246": {"count": 5}, "247": {"count": 3}, "248": {"count": 3}, "249": {"count": 5}, "250": {"count": 5}, "251": {"count": 4}, "252": {"count": 2}, "253": {"count": 5}, "254": {"count": 5}, "255": {"count": 5}, "256": {"count": 4}, "257": {"count": 4}, "258": {"count": 4}, "259": {"count": 3}, "260": {"count": 5}, "261": {"count": 4}, "262": {"count": 4}, "264": {"count": 4}, "265": {"count": 3}, "266": {"count": 5}, "267": {"count": 5}, "268": {"count": 3}, "269": {"count": 2}, "270": {"count": 3}, "271": {"count": 4}, "272": {"count": 4}, "273": {"count": 5}, "274": {"count": 5}, "275": {"count": 5}, "276": {"count": 2}, "277": {"count": 3}, "278": {"count": 5}, "279": {"count": 5}, "280": {"count": 4}, "281": {"count": 5}, "282": {"count": 5}, "283": {"count": 3}, "284": {"count": 5}, "285": {"count": 3}, "286": {"count": 5}, "287": {"count": 5}, "288": {"count": 4}, "289": {"count": 4}, "290": {"count": 5}, "291": {"count": 3}, "292": {"count": 2}, "293": {"count": 1}, "294": {"count": 1}, "295": {"count": 2}, "296": {"count": 4}, "297": {"count": 5}, "298": {"count": 4}, "300": {"count": 3}, "301": {"count": 3}, "303": {"count": 4}, "304": {"count": 4}, "305": {"count": 4}, "306": {"count": 2}, "307": {"count": 5}, "308": {"count": 4}, "309": {"count": 2}, "310": {"count": 3}, "311": {"count": 3}, "312": {"count": 4}, "313": {"count": 3}, "314": {"count": 3}, "315": {"count": 3}, "316": {"count": 5}, "317": {"count": 4}, "318": {"count": 5}, "319": {"count": 4}, "320": {"count": 4}, "321": {"count": 3}, "322": {"count": 5}, "323": {"count": 4}, "324": {"count": 2}, "325": {"count": 1}, "326": {"count": 3}, "327": {"count": 4}, "328": {"count": 3}, "330": {"count": 4}, "331": {"count": 4}, "332": {"count": 2}, "333": {"count": 5}, "334": {"count": 5}, "335": {"count": 5}, "336": {"count": 4}, "337": {"count": 4}, "338": {"count": 5}, "339": {"count": 3}, "340": {"count": 5}, "341": {"count": 5}, "342": {"count": 5}, "343": {"count": 2}, "344": {"count": 2}, "345": {"count": 3}, "346": {"count": 3}, "347": {"count": 5}, "348": {"count": 3}, "349": {"count": 2}, "350": {"count": 4}, "352": {"count": 5}, "353": {"count": 3}, "354": {"count": 5}, "355": {"count": 5}, "356": {"count": 4}, "357": {"count": 3}, "358": {"count": 3}, "359": {"count": 4}, "360": {"count": 5}, "361": {"count": 5}, "362": {"count": 4}, "363": {"count": 3}, "364": {"count": 4}, "365": {"count": 1}, "366": {"count": 4}, "367": {"count": 3}, "368": {"count": 4}, "369": {"count": 3}, "370": {"count": 5}, "371": {"count": 3}, "372": {"count": 5}, "373": {"count": 4}, "374": {"count": 4}, "375": {"count": 3}, "376": {"count": 4}, "377": {"count": 4}, "378": {"count": 4}, "379": {"count": 4}, "380": {"count": 4}, "381": {"count": 4}, "382": {"count": 1}, "383": {"count": 4}, "384": {"count": 4}, "385": {"count": 4}, "386": {"count": 2}, "387": {"count": 4}, "388": {"count": 2}, "389": {"count": 5}, "390": {"count": 4}, "391": {"count": 5}, "392": {"count": 4}, "394": {"count": 4}, "395": {"count": 4}, "396": {"count": 4}, "397": {"count": 4}, "398": {"count": 5}, "399": {"count": 4}, "400": {"count": 5}, "401": {"count": 4}, "402": {"count": 4}, "404": {"count": 5}, "405": {"count": 5}, "406": {"count": 5}, "407": {"count": 4}, "408": {"count": 2}, "409": {"count": 4}, "410": {"count": 3}, "411": {"count": 5}, "412": {"count": 4}, "413": {"count": 3}, "414": {"count": 4}, "415": {"count": 4}, "416": {"count": 4}, "417": {"count": 5}, "418": {"count": 3}, "419": {"count": 5}, "421": {"count": 4}, "422": {"count": 3}, "423": {"count": 5}, "424": {"count": 5}, "425": {"count": 2}, "426": {"count": 5}, "427": {"count": 4}, "428": {"count": 5}, "429": {"count": 3}, "430": {"count": 2}, "431": {"count": 3}, "432": {"count": 5}, "433": {"count": 4}, "434": {"count": 3}, "435": {"count": 3}, "437": {"count": 3}, "438": {"count": 5}, "439": {"count": 2}, "440": {"count": 4}, "441": {"count": 4}, "442": {"count": 5}, "443": {"count": 2}, "444": {"count": 3}, "445": {"count": 3}, "446": {"count": 5}, "447": {"count": 3}, "448": {"count": 2}, "449": {"count": 1}, "450": {"count": 3}, "451": {"count": 3}, "452": {"count": 4}, "453": {"count": 2}, "454": {"count": 4}, "455": {"count": 4}, "456": {"count": 5}, "458": {"count": 4}, "459": {"count": 4}, "460": {"count": 5}, "461": {"count": 4}, "462": {"count": 4}, "463": {"count": 5}, "464": {"count": 5}, "466": {"count": 2}, "467": {"count": 4}, "468": {"count": 3}, "469": {"count": 5}, "470": {"count": 5}, "471": {"count": 2}, "472": {"count": 4}, "473": {"count": 3}, "474": {"count": 5}, "475": {"count": 5}, "476": {"count": 5}, "477": {"count": 4}, "478": {"count": 2}, "479": {"count": 4}, "480": {"count": 4}, "481": {"count": 5}, "482": {"count": 4}, "483": {"count": 3}, "484": {"count": 5}, "485": {"count": 5}, "486": {"count": 4}, "487": {"count": 3}, "488": {"count": 3}, "489": {"count": 1}, "490": {"count": 1}, "491": {"count": 2}, "492": {"count": 4}, "493": {"count": 4}, "494": {"count": 3}, "495": {"count": 4}, "496": {"count": 5}, "497": {"count": 5}, "498": {"count": 5}, "499": {"count": 4}, "79": {"count": 4}, "106": {"count": 4}, "107": {"count": 4}, "202": {"count": 1}, "203": {"count": 1}, "457": {"count": 3}, "77": {"count": 2}, "78": {"count": 4}, "182": {"count": 2}, "263": {"count": 4}, "104": {"count": 1}, "158": {"count": 5}, "329": {"count": 1}, "393": {"count": 2}, "420": {"count": 2}}}} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/SUN397.json b/mteb/descriptive_stats/Image/ImageClassification/SUN397.json new file mode 100644 index 0000000000..cd840269be --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/SUN397.json @@ -0,0 +1 @@ +{"test": {"num_samples": 21750, "unique_num_labels": 397, "min_image_width": 125, "average_image_width": 354.21843678160917, "max_image_width": 696, "min_image_height": 94, "average_image_height": 291.1662988505747, "max_image_height": 595, "labels": {"227": {"count": 439}, "213": {"count": 335}, "53": {"count": 23}, "350": {"count": 40}, "73": {"count": 38}, "316": {"count": 63}, "177": {"count": 80}, "25": {"count": 39}, "275": {"count": 31}, "328": {"count": 33}, "263": {"count": 47}, "239": {"count": 26}, "41": {"count": 213}, "319": {"count": 51}, "91": {"count": 16}, "95": {"count": 183}, "396": {"count": 20}, "259": {"count": 36}, "107": {"count": 167}, "381": {"count": 164}, "174": {"count": 167}, "246": {"count": 44}, "67": {"count": 31}, "374": {"count": 28}, "354": {"count": 22}, "72": {"count": 100}, "97": {"count": 32}, "256": {"count": 57}, "247": {"count": 57}, "159": {"count": 49}, "270": {"count": 135}, "133": {"count": 215}, "197": {"count": 40}, "12": {"count": 38}, "2": {"count": 226}, "115": {"count": 75}, "200": {"count": 93}, "47": {"count": 103}, "9": {"count": 37}, "22": {"count": 76}, "255": {"count": 34}, "267": {"count": 22}, "244": {"count": 93}, "85": {"count": 115}, "342": {"count": 87}, "55": {"count": 50}, "7": {"count": 41}, "337": {"count": 99}, "38": {"count": 28}, "269": {"count": 69}, "106": {"count": 15}, "298": {"count": 27}, "361": {"count": 53}, "8": {"count": 108}, "166": {"count": 47}, "280": {"count": 51}, "35": {"count": 61}, "147": {"count": 82}, "214": {"count": 26}, "284": {"count": 28}, "286": {"count": 66}, "113": {"count": 67}, "83": {"count": 38}, "82": {"count": 236}, "365": {"count": 17}, "242": {"count": 116}, "186": {"count": 38}, "87": {"count": 111}, "274": {"count": 48}, "27": {"count": 95}, "283": {"count": 22}, "4": {"count": 76}, "334": {"count": 139}, "364": {"count": 21}, "48": {"count": 408}, "311": {"count": 41}, "101": {"count": 64}, "131": {"count": 55}, "172": {"count": 31}, "355": {"count": 28}, "308": {"count": 56}, "5": {"count": 47}, "318": {"count": 155}, "86": {"count": 87}, "46": {"count": 230}, "111": {"count": 69}, "88": {"count": 54}, "23": {"count": 47}, "70": {"count": 61}, "217": {"count": 34}, "11": {"count": 76}, "193": {"count": 207}, "0": {"count": 99}, "303": {"count": 23}, "324": {"count": 47}, "377": {"count": 19}, "345": {"count": 39}, "154": {"count": 49}, "393": {"count": 68}, "152": {"count": 58}, "317": {"count": 27}, "384": {"count": 46}, "257": {"count": 38}, "294": {"count": 47}, "145": {"count": 23}, "289": {"count": 33}, "375": {"count": 19}, "57": {"count": 42}, "15": {"count": 62}, "109": {"count": 24}, "139": {"count": 24}, "66": {"count": 26}, "340": {"count": 32}, "150": {"count": 41}, "118": {"count": 105}, "333": {"count": 27}, "126": {"count": 55}, "366": {"count": 116}, "358": {"count": 151}, "251": {"count": 37}, "309": {"count": 35}, "54": {"count": 20}, "327": {"count": 38}, "3": {"count": 60}, "21": {"count": 56}, "17": {"count": 62}, "146": {"count": 84}, "94": {"count": 42}, "243": {"count": 48}, "335": {"count": 85}, "245": {"count": 141}, "279": {"count": 187}, "360": {"count": 25}, "192": {"count": 105}, "49": {"count": 31}, "230": {"count": 81}, "357": {"count": 22}, "64": {"count": 72}, "112": {"count": 26}, "338": {"count": 70}, "216": {"count": 99}, "234": {"count": 183}, "300": {"count": 153}, "188": {"count": 48}, "254": {"count": 41}, "184": {"count": 183}, "373": {"count": 47}, "221": {"count": 86}, "84": {"count": 49}, "81": {"count": 119}, "161": {"count": 97}, "352": {"count": 21}, "105": {"count": 43}, "39": {"count": 59}, "383": {"count": 40}, "341": {"count": 56}, "63": {"count": 158}, "125": {"count": 29}, "302": {"count": 83}, "262": {"count": 40}, "392": {"count": 51}, "326": {"count": 173}, "228": {"count": 93}, "339": {"count": 25}, "80": {"count": 73}, "30": {"count": 42}, "264": {"count": 112}, "56": {"count": 94}, "321": {"count": 16}, "395": {"count": 52}, "68": {"count": 45}, "211": {"count": 45}, "44": {"count": 26}, "299": {"count": 21}, "220": {"count": 35}, "61": {"count": 20}, "138": {"count": 55}, "108": {"count": 111}, "10": {"count": 35}, "386": {"count": 28}, "297": {"count": 49}, "210": {"count": 36}, "175": {"count": 77}, "260": {"count": 68}, "391": {"count": 69}, "102": {"count": 77}, "26": {"count": 44}, "232": {"count": 54}, "6": {"count": 158}, "124": {"count": 43}, "14": {"count": 23}, "201": {"count": 39}, "168": {"count": 18}, "202": {"count": 26}, "140": {"count": 31}, "261": {"count": 60}, "104": {"count": 27}, "356": {"count": 22}, "34": {"count": 147}, "225": {"count": 111}, "60": {"count": 84}, "156": {"count": 35}, "237": {"count": 45}, "268": {"count": 87}, "310": {"count": 31}, "249": {"count": 73}, "281": {"count": 46}, "75": {"count": 89}, "77": {"count": 53}, "132": {"count": 45}, "235": {"count": 42}, "336": {"count": 84}, "123": {"count": 27}, "349": {"count": 90}, "180": {"count": 49}, "378": {"count": 17}, "332": {"count": 30}, "185": {"count": 29}, "389": {"count": 60}, "382": {"count": 77}, "198": {"count": 54}, "74": {"count": 48}, "231": {"count": 85}, "76": {"count": 54}, "151": {"count": 64}, "182": {"count": 17}, "209": {"count": 39}, "344": {"count": 37}, "204": {"count": 67}, "329": {"count": 23}, "380": {"count": 91}, "388": {"count": 32}, "116": {"count": 29}, "24": {"count": 103}, "199": {"count": 33}, "369": {"count": 14}, "359": {"count": 77}, "325": {"count": 39}, "323": {"count": 34}, "162": {"count": 35}, "33": {"count": 46}, "129": {"count": 21}, "287": {"count": 30}, "155": {"count": 24}, "170": {"count": 157}, "296": {"count": 40}, "110": {"count": 102}, "304": {"count": 21}, "164": {"count": 37}, "278": {"count": 23}, "71": {"count": 18}, "194": {"count": 24}, "136": {"count": 117}, "103": {"count": 134}, "330": {"count": 26}, "347": {"count": 26}, "206": {"count": 50}, "178": {"count": 43}, "362": {"count": 26}, "119": {"count": 111}, "208": {"count": 33}, "165": {"count": 44}, "90": {"count": 36}, "167": {"count": 40}, "187": {"count": 26}, "99": {"count": 50}, "390": {"count": 64}, "205": {"count": 16}, "65": {"count": 30}, "293": {"count": 23}, "223": {"count": 19}, "96": {"count": 31}, "305": {"count": 44}, "100": {"count": 57}, "385": {"count": 18}, "78": {"count": 42}, "59": {"count": 20}, "37": {"count": 59}, "219": {"count": 76}, "212": {"count": 28}, "1": {"count": 26}, "122": {"count": 35}, "92": {"count": 62}, "43": {"count": 39}, "196": {"count": 56}, "19": {"count": 25}, "128": {"count": 35}, "376": {"count": 77}, "313": {"count": 30}, "114": {"count": 54}, "121": {"count": 31}, "169": {"count": 62}, "331": {"count": 55}, "238": {"count": 16}, "179": {"count": 31}, "127": {"count": 31}, "370": {"count": 98}, "149": {"count": 47}, "346": {"count": 41}, "250": {"count": 22}, "276": {"count": 25}, "163": {"count": 43}, "18": {"count": 33}, "282": {"count": 23}, "215": {"count": 33}, "258": {"count": 60}, "240": {"count": 29}, "233": {"count": 14}, "93": {"count": 27}, "69": {"count": 23}, "266": {"count": 26}, "387": {"count": 55}, "141": {"count": 18}, "191": {"count": 26}, "183": {"count": 42}, "271": {"count": 22}, "120": {"count": 32}, "98": {"count": 53}, "29": {"count": 34}, "28": {"count": 21}, "144": {"count": 26}, "351": {"count": 50}, "368": {"count": 20}, "314": {"count": 27}, "45": {"count": 17}, "218": {"count": 50}, "348": {"count": 25}, "157": {"count": 35}, "117": {"count": 24}, "367": {"count": 24}, "13": {"count": 31}, "363": {"count": 22}, "79": {"count": 28}, "312": {"count": 27}, "372": {"count": 29}, "189": {"count": 21}, "50": {"count": 22}, "160": {"count": 35}, "16": {"count": 39}, "222": {"count": 21}, "58": {"count": 37}, "153": {"count": 64}, "62": {"count": 21}, "290": {"count": 25}, "292": {"count": 24}, "285": {"count": 25}, "343": {"count": 32}, "301": {"count": 19}, "190": {"count": 46}, "195": {"count": 24}, "135": {"count": 30}, "315": {"count": 25}, "203": {"count": 29}, "307": {"count": 18}, "142": {"count": 25}, "173": {"count": 28}, "236": {"count": 41}, "171": {"count": 23}, "371": {"count": 17}, "130": {"count": 15}, "277": {"count": 39}, "248": {"count": 22}, "181": {"count": 35}, "40": {"count": 20}, "322": {"count": 15}, "273": {"count": 23}, "148": {"count": 23}, "295": {"count": 25}, "32": {"count": 21}, "320": {"count": 25}, "137": {"count": 32}, "253": {"count": 36}, "31": {"count": 19}, "306": {"count": 27}, "51": {"count": 19}, "52": {"count": 29}, "176": {"count": 31}, "241": {"count": 23}, "265": {"count": 32}, "394": {"count": 26}, "158": {"count": 26}, "226": {"count": 28}, "288": {"count": 21}, "353": {"count": 19}, "291": {"count": 21}, "224": {"count": 26}, "36": {"count": 38}, "20": {"count": 22}, "252": {"count": 18}, "134": {"count": 24}, "143": {"count": 21}, "207": {"count": 28}, "89": {"count": 16}, "272": {"count": 23}, "379": {"count": 24}, "229": {"count": 20}, "42": {"count": 23}}}} \ No newline at end of file diff --git a/mteb/descriptive_stats/Image/ImageClassification/UCF101.json b/mteb/descriptive_stats/Image/ImageClassification/UCF101.json new file mode 100644 index 0000000000..be8f90403a --- /dev/null +++ b/mteb/descriptive_stats/Image/ImageClassification/UCF101.json @@ -0,0 +1 @@ +{"test": {"num_samples": 697222, "unique_num_labels": 101, "min_image_width": 320, "average_image_width": 320.1187570099624, "max_image_width": 400, "min_image_height": 226, "average_image_height": 239.97921752325658, "max_image_height": 240, "labels": {"0": {"count": 7475}, "1": {"count": 6341}, "2": {"count": 6181}, "3": {"count": 6320}, "4": {"count": 3708}, "5": {"count": 7296}, "6": {"count": 4004}, "7": {"count": 3923}, "8": {"count": 2267}, "9": {"count": 5587}, "10": {"count": 8946}, "11": {"count": 12714}, "12": {"count": 6053}, "13": {"count": 3191}, "14": {"count": 3696}, "15": {"count": 5468}, "16": {"count": 10032}, "17": {"count": 8346}, "18": {"count": 5098}, "19": {"count": 10811}, "20": {"count": 6378}, "21": {"count": 3385}, "22": {"count": 3974}, "23": {"count": 4781}, "24": {"count": 5867}, "25": {"count": 7904}, "26": {"count": 12181}, "27": {"count": 4511}, "28": {"count": 4402}, "29": {"count": 5513}, "30": {"count": 3236}, "31": {"count": 7160}, "32": {"count": 6455}, "33": {"count": 3766}, "34": {"count": 8362}, "35": {"count": 3521}, "36": {"count": 3263}, "37": {"count": 5112}, "38": {"count": 9685}, "39": {"count": 4598}, "40": {"count": 6682}, "41": {"count": 8690}, "42": {"count": 3591}, "43": {"count": 11432}, "44": {"count": 3458}, "45": {"count": 10080}, "46": {"count": 16507}, "47": {"count": 3001}, "48": {"count": 6524}, "49": {"count": 7786}, "50": {"count": 4657}, "51": {"count": 8795}, "52": {"count": 3992}, "53": {"count": 5668}, "54": {"count": 6575}, "55": {"count": 8662}, "56": {"count": 5253}, "57": {"count": 3761}, "58": {"count": 8679}, "59": {"count": 11986}, "60": {"count": 15720}, "61": {"count": 12080}, "62": {"count": 10634}, "63": {"count": 6161}, "64": {"count": 13934}, "65": {"count": 8393}, "66": {"count": 5452}, "67": {"count": 7905}, "68": {"count": 12354}, "69": {"count": 4060}, "70": {"count": 9075}, "71": {"count": 2689}, "72": {"count": 5435}, "73": {"count": 17655}, "74": {"count": 5693}, "75": {"count": 12572}, "76": {"count": 9543}, "77": {"count": 10793}, "78": {"count": 4134}, "79": {"count": 4832}, "80": {"count": 8977}, "81": {"count": 7381}, "82": {"count": 4927}, "83": {"count": 12469}, "84": {"count": 3843}, "85": {"count": 4945}, "86": {"count": 6724}, "87": {"count": 6582}, "88": {"count": 7046}, "89": {"count": 5874}, "90": {"count": 4878}, "91": {"count": 6417}, "92": {"count": 3762}, "93": {"count": 7349}, "94": {"count": 8149}, "95": {"count": 3925}, "96": {"count": 3378}, "97": {"count": 7721}, "98": {"count": 3671}, "99": {"count": 6292}, "100": {"count": 6508}}}} \ No newline at end of file