From fb66000d158f0a231f0f825a63b4a650845d77e7 Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Sat, 21 May 2022 20:00:55 +0900
Subject: [PATCH 01/15] Added automated basic model export to CI

---
 .github/workflows/ci-testing.yml |  12 +++
 requirements.txt                 |   3 +
 tests/conftest.py                |   7 ++
 tests/test_export.py             | 140 +++++++++++++++++++++++++++++++
 4 files changed, 162 insertions(+)
 create mode 100644 tests/conftest.py
 create mode 100644 tests/test_export.py

diff --git a/.github/workflows/ci-testing.yml b/.github/workflows/ci-testing.yml
index e5d5fc434f06..0bf7fca53914 100644
--- a/.github/workflows/ci-testing.yml
+++ b/.github/workflows/ci-testing.yml
@@ -91,3 +91,15 @@ jobs:
           EOF
 
         shell: bash
+
+      - name: install pytest dependencies
+        run: |
+          pip install -r requirements.txt coremltools onnx onnx-simplifier onnxruntime openvino-dev tensorflow-cpu
+        shell: bash
+
+      - name: Run pytest
+        run: |
+          # Weights should be available from previous workflow
+          weights=runs/train/exp/weights/best.pt
+          pytest tests --weights $weights
+        shell: bash
diff --git a/requirements.txt b/requirements.txt
index 4cf22b7093b4..fbe0ef1e6820 100755
--- a/requirements.txt
+++ b/requirements.txt
@@ -20,6 +20,9 @@ tensorboard>=2.4.1
 pandas>=1.1.4
 seaborn>=0.11.0
 
+# Test ----------------------------------------
+pytest
+
 # Export --------------------------------------
 # coremltools>=4.1  # CoreML export
 # onnx>=1.9.0  # ONNX export
diff --git a/tests/conftest.py b/tests/conftest.py
new file mode 100644
index 000000000000..6af0fbb47151
--- /dev/null
+++ b/tests/conftest.py
@@ -0,0 +1,7 @@
+
+_REQUIRED_ARGUMENTS = ('weights',)
+
+
+def pytest_addoption(parser):
+    for argument in _REQUIRED_ARGUMENTS:
+        parser.addoption(f'--{argument}', default=None)
diff --git a/tests/test_export.py b/tests/test_export.py
new file mode 100644
index 000000000000..afaa1defcf5c
--- /dev/null
+++ b/tests/test_export.py
@@ -0,0 +1,140 @@
+"""
+Tests intended to run on CI to ensure that models are being correctly serialized.
+To run the tests, first install the requirements by typing in:
+pip install -r requirements.txt
+Afterwards, from the project's root, type in:
+pytest tests --weights="yolov5s.pt"
+Check out the pytest website for more information
+"""
+import os
+import shutil
+import stat
+import subprocess
+import sys
+import typing as t
+from pathlib import Path
+
+import pytest
+import torch
+
+FILE = Path(__file__).resolve()
+ROOT = FILE.parents[1]  # YOLOv5 root directory
+if str(ROOT) not in sys.path:
+    sys.path.append(str(ROOT))  # add ROOT to PATH
+
+from export import export_formats, run
+
+# Fixtures
+# ----------------------
+
+
+@pytest.fixture(scope='session')
+def weights(pytestconfig):
+    return pytestconfig.getoption('weights')
+
+
+@pytest.fixture(scope='session')
+def cleanup(weights):
+    yield
+    for _, export_format_argument, suffix, ___ in cpu_export_formats():
+        output_path = weights.replace('.pt', suffix.lower())
+        if export_format_argument == 'tflite':
+            output_path = output_path.replace('.tflite', f'-int8.tflite')
+        elif export_format_argument == 'edgetpu':
+            output_path = output_path.replace('.tflite', f'-int8_edgetpu.tflite')
+        if os.path.exists(output_path):
+            if os.path.isdir(output_path):
+                shutil.rmtree(output_path, onerror=del_rw)
+            else:
+                os.chmod(output_path, stat.S_IWRITE)
+                os.remove(output_path)
+
+
+# Utils
+# ---------------------
+
+def del_rw(action, file_path, exc):
+    os.chmod(file_path, stat.S_IWRITE)
+    os.remove(file_path)
+
+
+def gpu_export_formats():
+    formats = export_formats()
+    return formats[formats['GPU'] == True].values.tolist()
+
+
+def cpu_export_formats() -> t.List:
+    """
+    Get list of models that can be exported without gpu.
+    Note that some of these require special environments to serialize.
+    """
+    formats = export_formats()
+    return formats[formats['Format'].isin(
+        ('ONNX', 'OpenVINO', 'CoreML', 'TensorFlow SavedModel', 'TensorFlow GraphDef',
+        'TensorFlow Lite', 'TensorFlow Edge TPU', 'TensorFlow.js',)
+    )].values.tolist()
+
+
+# Tests
+# ----------------------
+
+def test_model_exists(weights: str):
+    """
+    Raise an error if model in specified path does not exist
+    Args:
+        weights: The path to yolov5 weight
+    """
+    assert weights is not None, 'Please specify --weights when running pytest.'
+    assert weights.endswith('.pt'), f'weights must end with ".pt". Passed in: {weights}'
+    assert os.path.exists(weights), f'Weights could not be found in: "{weights}"'
+
+
+@pytest.mark.usefixtures('cleanup')
+@pytest.mark.parametrize('export_format_row', cpu_export_formats())
+def test_export_cpu(weights, export_format_row: t.List):
+    _, export_format_argument, suffix, ___ = export_format_row
+    if export_format_argument in ('engine', 'coreml'):
+        pytest.skip(f'Export format: "{export_format_argument}" requires special environment. Skipping.')
+
+    # make img small for quick tests
+    img_sz = (160, 160)
+
+    # As of now, openvino requires numpy < 1.20.
+    # numpy will be downgraded during openvino run
+    # so we need to re-upgrade numpy
+    if export_format_argument == 'openvino':
+        subprocess.run('pip install numpy==1.19.5', shell=True)
+    elif export_format_argument == 'tfjs':
+        subprocess.run('pip install --upgrade numpy', shell=True)
+
+    # create the model
+    run(weights=weights, imgsz=img_sz, include=(export_format_argument,), int8=True)
+    output_path = weights.replace('.pt', suffix.lower())
+
+    if os.path.isdir(output_path):
+        # For now, we do a simple check to see whether files are not empty
+        directory = os.fsencode(output_path)
+        file_count = 0
+        for subdir, dirs, files in os.walk(directory):
+            for file in files:
+                file_path = os.path.join(subdir, file)
+                file_count += 1
+                file_is_not_empty = os.stat(file_path).st_size > 0
+                assert file_is_not_empty, f'File: "{file_path}" should not be empty.'
+        # Serialized folder should contain at least one file
+        assert file_count > 0, 'Folder is empty'
+    else:
+        if export_format_argument == 'tflite':
+            output_path = weights.replace('.tflite', f'-int8.tflite')
+        elif export_format_argument == 'edgetpu':
+            output_path = weights.replace('.tflite', f'-int8_edgetpu.tflite')
+        assert os.path.exists(output_path), f'Failed to serialize "{output_path}".'
+
+    # TODO: we can add new tests to check mAP of the exported model on VOC dataset
+
+
+@pytest.mark.skipif(not torch.cuda.is_available(), reason='Test requires cuda')
+@pytest.mark.parametrize('export_format_row', gpu_export_formats())
+def test_export_gpu(export_format_row: t.List):
+    # TODO: Test when runner with GPU is available
+    pass

From 4bcb03941dc3ae205b3dc9529d9d45e0bc631608 Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Sat, 21 May 2022 20:09:48 +0900
Subject: [PATCH 02/15] Flake8 fix

---
 tests/test_export.py | 26 +++++++++++++++++---------
 1 file changed, 17 insertions(+), 9 deletions(-)

diff --git a/tests/test_export.py b/tests/test_export.py
index afaa1defcf5c..191bb8d9f251 100644
--- a/tests/test_export.py
+++ b/tests/test_export.py
@@ -39,9 +39,9 @@ def cleanup(weights):
     for _, export_format_argument, suffix, ___ in cpu_export_formats():
         output_path = weights.replace('.pt', suffix.lower())
         if export_format_argument == 'tflite':
-            output_path = output_path.replace('.tflite', f'-int8.tflite')
+            output_path = output_path.replace('.tflite', '-int8.tflite')
         elif export_format_argument == 'edgetpu':
-            output_path = output_path.replace('.tflite', f'-int8_edgetpu.tflite')
+            output_path = output_path.replace('.tflite', '-int8_edgetpu.tflite')
         if os.path.exists(output_path):
             if os.path.isdir(output_path):
                 shutil.rmtree(output_path, onerror=del_rw)
@@ -53,6 +53,7 @@ def cleanup(weights):
 # Utils
 # ---------------------
 
+
 def del_rw(action, file_path, exc):
     os.chmod(file_path, stat.S_IWRITE)
     os.remove(file_path)
@@ -60,7 +61,7 @@ def del_rw(action, file_path, exc):
 
 def gpu_export_formats():
     formats = export_formats()
-    return formats[formats['GPU'] == True].values.tolist()
+    return formats[formats['GPU']].values.tolist()
 
 
 def cpu_export_formats() -> t.List:
@@ -69,15 +70,22 @@ def cpu_export_formats() -> t.List:
     Note that some of these require special environments to serialize.
     """
     formats = export_formats()
-    return formats[formats['Format'].isin(
-        ('ONNX', 'OpenVINO', 'CoreML', 'TensorFlow SavedModel', 'TensorFlow GraphDef',
-        'TensorFlow Lite', 'TensorFlow Edge TPU', 'TensorFlow.js',)
-    )].values.tolist()
+    return formats[formats['Format'].isin((
+        'ONNX',
+        'OpenVINO',
+        'CoreML',
+        'TensorFlow SavedModel',
+        'TensorFlow GraphDef',
+        'TensorFlow Lite',
+        'TensorFlow Edge TPU',
+        'TensorFlow.js',
+    ))].values.tolist()
 
 
 # Tests
 # ----------------------
 
+
 def test_model_exists(weights: str):
     """
     Raise an error if model in specified path does not exist
@@ -125,9 +133,9 @@ def test_export_cpu(weights, export_format_row: t.List):
         assert file_count > 0, 'Folder is empty'
     else:
         if export_format_argument == 'tflite':
-            output_path = weights.replace('.tflite', f'-int8.tflite')
+            output_path = weights.replace('.tflite', '-int8.tflite')
         elif export_format_argument == 'edgetpu':
-            output_path = weights.replace('.tflite', f'-int8_edgetpu.tflite')
+            output_path = weights.replace('.tflite', '-int8_edgetpu.tflite')
         assert os.path.exists(output_path), f'Failed to serialize "{output_path}".'
 
     # TODO: we can add new tests to check mAP of the exported model on VOC dataset

From cda6cc3898ddeb1b8c58084990991e74eae4feb4 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Sat, 21 May 2022 11:04:20 +0000
Subject: [PATCH 03/15] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 tests/conftest.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index 6af0fbb47151..cd3383cd4c9b 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -1,4 +1,3 @@
-
 _REQUIRED_ARGUMENTS = ('weights',)
 
 

From 8756d6a34e4de899dcfc7da1c91b987836cc94ba Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Sat, 21 May 2022 20:20:51 +0900
Subject: [PATCH 04/15] Merge dependency installation into previous workflow
 step

---
 .github/workflows/ci-testing.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/ci-testing.yml b/.github/workflows/ci-testing.yml
index 0bf7fca53914..eb0e9483d152 100644
--- a/.github/workflows/ci-testing.yml
+++ b/.github/workflows/ci-testing.yml
@@ -94,7 +94,7 @@ jobs:
 
       - name: install pytest dependencies
         run: |
-          pip install -r requirements.txt coremltools onnx onnx-simplifier onnxruntime openvino-dev tensorflow-cpu
+          pip install coremltools onnx onnx-simplifier onnxruntime openvino-dev tensorflow-cpu tensorflowjs --user
         shell: bash
 
       - name: Run pytest

From b2f658b40b826e5c9fe44c5908023a5506ee3caf Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Sat, 21 May 2022 23:20:44 +0900
Subject: [PATCH 05/15] commented out openvino test due to compatibility issues
 between OpenVINO and Tensorflowjs

---
 .github/workflows/ci-testing.yml | 19 ++++---------------
 tests/test_export.py             | 13 ++++---------
 2 files changed, 8 insertions(+), 24 deletions(-)

diff --git a/.github/workflows/ci-testing.yml b/.github/workflows/ci-testing.yml
index eb0e9483d152..3422d205fbe4 100644
--- a/.github/workflows/ci-testing.yml
+++ b/.github/workflows/ci-testing.yml
@@ -50,8 +50,9 @@ jobs:
       - name: Install dependencies
         run: |
           python -m pip install --upgrade pip
-          pip install -qr requirements.txt -f https://download.pytorch.org/whl/cpu/torch_stable.html \
-            onnx tensorflow-cpu  # wandb
+          # tensorflowjs for unit test
+          pip install -qr requirements.txt -f https://download.pytorch.org/whl/cpu/torch_stable.html tensorflowjs \
+            onnx tensorflow-cpu # wandb
           python --version
           pip --version
           pip list
@@ -83,7 +84,7 @@ jobs:
           # Export
           python models/yolo.py --cfg ${{ matrix.model }}.yaml  # build PyTorch model
           python models/tf.py --weights ${{ matrix.model }}.pt  # build TensorFlow model
-          python export.py --weights ${{ matrix.model }}.pt --img 64 --include torchscript onnx  # export
+          pytest tests --weights $weights
           # Python
           python - <<EOF
           import torch
@@ -91,15 +92,3 @@ jobs:
           EOF
 
         shell: bash
-
-      - name: install pytest dependencies
-        run: |
-          pip install coremltools onnx onnx-simplifier onnxruntime openvino-dev tensorflow-cpu tensorflowjs --user
-        shell: bash
-
-      - name: Run pytest
-        run: |
-          # Weights should be available from previous workflow
-          weights=runs/train/exp/weights/best.pt
-          pytest tests --weights $weights
-        shell: bash
diff --git a/tests/test_export.py b/tests/test_export.py
index 191bb8d9f251..67c012801d8b 100644
--- a/tests/test_export.py
+++ b/tests/test_export.py
@@ -72,7 +72,10 @@ def cpu_export_formats() -> t.List:
     formats = export_formats()
     return formats[formats['Format'].isin((
         'ONNX',
-        'OpenVINO',
+        # Numpy version mismatch between
+        # OpenVINO and tfjs where OpenVINO requires numpy 1.20
+        # and tfjs requires > 1.20
+        # 'OpenVINO',
         'CoreML',
         'TensorFlow SavedModel',
         'TensorFlow GraphDef',
@@ -107,14 +110,6 @@ def test_export_cpu(weights, export_format_row: t.List):
     # make img small for quick tests
     img_sz = (160, 160)
 
-    # As of now, openvino requires numpy < 1.20.
-    # numpy will be downgraded during openvino run
-    # so we need to re-upgrade numpy
-    if export_format_argument == 'openvino':
-        subprocess.run('pip install numpy==1.19.5', shell=True)
-    elif export_format_argument == 'tfjs':
-        subprocess.run('pip install --upgrade numpy', shell=True)
-
     # create the model
     run(weights=weights, imgsz=img_sz, include=(export_format_argument,), int8=True)
     output_path = weights.replace('.pt', suffix.lower())

From 75252151fee70b3b6a56c096af70019729e98e18 Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Mon, 23 May 2022 14:28:10 +0900
Subject: [PATCH 06/15] Revert all changes made in current branch

---
 .github/workflows/ci-testing.yml |   7 +-
 requirements.txt                 |   3 -
 tests/conftest.py                |   6 --
 tests/test_export.py             | 143 -------------------------------
 4 files changed, 3 insertions(+), 156 deletions(-)
 delete mode 100644 tests/conftest.py
 delete mode 100644 tests/test_export.py

diff --git a/.github/workflows/ci-testing.yml b/.github/workflows/ci-testing.yml
index 3422d205fbe4..e5d5fc434f06 100644
--- a/.github/workflows/ci-testing.yml
+++ b/.github/workflows/ci-testing.yml
@@ -50,9 +50,8 @@ jobs:
       - name: Install dependencies
         run: |
           python -m pip install --upgrade pip
-          # tensorflowjs for unit test
-          pip install -qr requirements.txt -f https://download.pytorch.org/whl/cpu/torch_stable.html tensorflowjs \
-            onnx tensorflow-cpu # wandb
+          pip install -qr requirements.txt -f https://download.pytorch.org/whl/cpu/torch_stable.html \
+            onnx tensorflow-cpu  # wandb
           python --version
           pip --version
           pip list
@@ -84,7 +83,7 @@ jobs:
           # Export
           python models/yolo.py --cfg ${{ matrix.model }}.yaml  # build PyTorch model
           python models/tf.py --weights ${{ matrix.model }}.pt  # build TensorFlow model
-          pytest tests --weights $weights
+          python export.py --weights ${{ matrix.model }}.pt --img 64 --include torchscript onnx  # export
           # Python
           python - <<EOF
           import torch
diff --git a/requirements.txt b/requirements.txt
index fbe0ef1e6820..4cf22b7093b4 100755
--- a/requirements.txt
+++ b/requirements.txt
@@ -20,9 +20,6 @@ tensorboard>=2.4.1
 pandas>=1.1.4
 seaborn>=0.11.0
 
-# Test ----------------------------------------
-pytest
-
 # Export --------------------------------------
 # coremltools>=4.1  # CoreML export
 # onnx>=1.9.0  # ONNX export
diff --git a/tests/conftest.py b/tests/conftest.py
deleted file mode 100644
index cd3383cd4c9b..000000000000
--- a/tests/conftest.py
+++ /dev/null
@@ -1,6 +0,0 @@
-_REQUIRED_ARGUMENTS = ('weights',)
-
-
-def pytest_addoption(parser):
-    for argument in _REQUIRED_ARGUMENTS:
-        parser.addoption(f'--{argument}', default=None)
diff --git a/tests/test_export.py b/tests/test_export.py
deleted file mode 100644
index 67c012801d8b..000000000000
--- a/tests/test_export.py
+++ /dev/null
@@ -1,143 +0,0 @@
-"""
-Tests intended to run on CI to ensure that models are being correctly serialized.
-To run the tests, first install the requirements by typing in:
-pip install -r requirements.txt
-Afterwards, from the project's root, type in:
-pytest tests --weights="yolov5s.pt"
-Check out the pytest website for more information
-"""
-import os
-import shutil
-import stat
-import subprocess
-import sys
-import typing as t
-from pathlib import Path
-
-import pytest
-import torch
-
-FILE = Path(__file__).resolve()
-ROOT = FILE.parents[1]  # YOLOv5 root directory
-if str(ROOT) not in sys.path:
-    sys.path.append(str(ROOT))  # add ROOT to PATH
-
-from export import export_formats, run
-
-# Fixtures
-# ----------------------
-
-
-@pytest.fixture(scope='session')
-def weights(pytestconfig):
-    return pytestconfig.getoption('weights')
-
-
-@pytest.fixture(scope='session')
-def cleanup(weights):
-    yield
-    for _, export_format_argument, suffix, ___ in cpu_export_formats():
-        output_path = weights.replace('.pt', suffix.lower())
-        if export_format_argument == 'tflite':
-            output_path = output_path.replace('.tflite', '-int8.tflite')
-        elif export_format_argument == 'edgetpu':
-            output_path = output_path.replace('.tflite', '-int8_edgetpu.tflite')
-        if os.path.exists(output_path):
-            if os.path.isdir(output_path):
-                shutil.rmtree(output_path, onerror=del_rw)
-            else:
-                os.chmod(output_path, stat.S_IWRITE)
-                os.remove(output_path)
-
-
-# Utils
-# ---------------------
-
-
-def del_rw(action, file_path, exc):
-    os.chmod(file_path, stat.S_IWRITE)
-    os.remove(file_path)
-
-
-def gpu_export_formats():
-    formats = export_formats()
-    return formats[formats['GPU']].values.tolist()
-
-
-def cpu_export_formats() -> t.List:
-    """
-    Get list of models that can be exported without gpu.
-    Note that some of these require special environments to serialize.
-    """
-    formats = export_formats()
-    return formats[formats['Format'].isin((
-        'ONNX',
-        # Numpy version mismatch between
-        # OpenVINO and tfjs where OpenVINO requires numpy 1.20
-        # and tfjs requires > 1.20
-        # 'OpenVINO',
-        'CoreML',
-        'TensorFlow SavedModel',
-        'TensorFlow GraphDef',
-        'TensorFlow Lite',
-        'TensorFlow Edge TPU',
-        'TensorFlow.js',
-    ))].values.tolist()
-
-
-# Tests
-# ----------------------
-
-
-def test_model_exists(weights: str):
-    """
-    Raise an error if model in specified path does not exist
-    Args:
-        weights: The path to yolov5 weight
-    """
-    assert weights is not None, 'Please specify --weights when running pytest.'
-    assert weights.endswith('.pt'), f'weights must end with ".pt". Passed in: {weights}'
-    assert os.path.exists(weights), f'Weights could not be found in: "{weights}"'
-
-
-@pytest.mark.usefixtures('cleanup')
-@pytest.mark.parametrize('export_format_row', cpu_export_formats())
-def test_export_cpu(weights, export_format_row: t.List):
-    _, export_format_argument, suffix, ___ = export_format_row
-    if export_format_argument in ('engine', 'coreml'):
-        pytest.skip(f'Export format: "{export_format_argument}" requires special environment. Skipping.')
-
-    # make img small for quick tests
-    img_sz = (160, 160)
-
-    # create the model
-    run(weights=weights, imgsz=img_sz, include=(export_format_argument,), int8=True)
-    output_path = weights.replace('.pt', suffix.lower())
-
-    if os.path.isdir(output_path):
-        # For now, we do a simple check to see whether files are not empty
-        directory = os.fsencode(output_path)
-        file_count = 0
-        for subdir, dirs, files in os.walk(directory):
-            for file in files:
-                file_path = os.path.join(subdir, file)
-                file_count += 1
-                file_is_not_empty = os.stat(file_path).st_size > 0
-                assert file_is_not_empty, f'File: "{file_path}" should not be empty.'
-        # Serialized folder should contain at least one file
-        assert file_count > 0, 'Folder is empty'
-    else:
-        if export_format_argument == 'tflite':
-            output_path = weights.replace('.tflite', '-int8.tflite')
-        elif export_format_argument == 'edgetpu':
-            output_path = weights.replace('.tflite', '-int8_edgetpu.tflite')
-        assert os.path.exists(output_path), f'Failed to serialize "{output_path}".'
-
-    # TODO: we can add new tests to check mAP of the exported model on VOC dataset
-
-
-@pytest.mark.skipif(not torch.cuda.is_available(), reason='Test requires cuda')
-@pytest.mark.parametrize('export_format_row', gpu_export_formats())
-def test_export_gpu(export_format_row: t.List):
-    # TODO: Test when runner with GPU is available
-    pass

From e9343fa3ba92483976593f449095778cf67f7d00 Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Mon, 23 May 2022 17:36:34 +0900
Subject: [PATCH 07/15] Added hard-fail support to enforce hard-failure mode
 and mAP threshold assertions

---
 .github/workflows/ci-benchmarking.yml |  66 ++++++++++++++
 data/coco128.yaml                     |  18 ++++
 utils/benchmarks.py                   | 123 +++++++++++++++++++++-----
 3 files changed, 187 insertions(+), 20 deletions(-)
 create mode 100644 .github/workflows/ci-benchmarking.yml

diff --git a/.github/workflows/ci-benchmarking.yml b/.github/workflows/ci-benchmarking.yml
new file mode 100644
index 000000000000..849faa649c8f
--- /dev/null
+++ b/.github/workflows/ci-benchmarking.yml
@@ -0,0 +1,66 @@
+# YOLOv5 🚀 by Ultralytics, GPL-3.0 license
+
+name: CI Benchmarking
+
+on: # https://help.github.com/en/actions/reference/events-that-trigger-workflows
+  push:
+    branches: [ master ]
+  pull_request:
+    # The branches below must be a subset of the branches above
+    branches: [ master ]
+  schedule:
+    - cron: '0 0 * * *'  # Runs at 00:00 UTC every day
+
+jobs:
+  cpu-tests:
+
+    runs-on: ${{ matrix.os }}
+    strategy:
+      fail-fast: true
+      matrix:
+        os: [ ubuntu-latest ]
+        python-version: [ 3.9 ]
+        model: [ 'yolov5n', 'yolov5s' ]  # models to test
+
+    # Timeout: https://stackoverflow.com/a/59076067/4521646
+    timeout-minutes: 60
+    steps:
+      - uses: actions/checkout@v3
+      - name: Set up Python ${{ matrix.python-version }}
+        uses: actions/setup-python@v3
+        with:
+          python-version: ${{ matrix.python-version }}
+
+      # Note: This uses an internal pip API and may not always work
+      # https://github.com/actions/cache/blob/master/examples.md#multiple-oss-in-a-workflow
+      - name: Get pip cache
+        id: pip-cache
+        run: |
+          python -c "from pip._internal.locations import USER_CACHE_DIR; print('::set-output name=dir::' + USER_CACHE_DIR)"
+
+      - name: Cache pip
+        uses: actions/cache@v3
+        with:
+          path: ${{ steps.pip-cache.outputs.dir }}
+          key: ${{ runner.os }}-${{ matrix.python-version }}-pip-${{ hashFiles('requirements.txt') }}
+          restore-keys: |
+            ${{ runner.os }}-${{ matrix.python-version }}-pip-
+
+      # Known Keras 2.7.0 issue: https://github.com/ultralytics/yolov5/pull/5486
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install -qr requirements.txt -f https://download.pytorch.org/whl/cpu/torch_stable.html \
+            onnx tensorflow-cpu  # wandb
+          python --version
+          pip --version
+          pip list
+        shell: bash
+
+      - name: Run benchmarking
+        run: |
+          weights=runs/train/exp/weights/best.pt
+          # benchmarking. Set --hard-fail to catch errors when mAP not above certain threshold
+          python utils/benchmarks.py --hard-fail
+
+        shell: bash
diff --git a/data/coco128.yaml b/data/coco128.yaml
index 2517d2079257..ebcd5b27c47c 100644
--- a/data/coco128.yaml
+++ b/data/coco128.yaml
@@ -28,3 +28,21 @@ names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus', 'train', 't
 
 # Download script/URL (optional)
 download: https://ultralytics.com/assets/coco128.zip
+
+# Benchmark values
+benchmarks:
+  # metrics E.g. mAP
+  mAP:
+    # Img size 640
+    yolov5n: 0.45
+    yolov5s: 0.45
+    yolov5m: 0.45
+    yolov5l: 0.45
+    yolov5x: 0.45
+
+    # Img size 1280
+    yolov5n6: 50
+    yolov5s6: 50
+    yolov5m6: 60
+    yolov5l6: 60
+    yolov5x6: 60
diff --git a/utils/benchmarks.py b/utils/benchmarks.py
index c3636b9e4df4..c349df3fd71a 100644
--- a/utils/benchmarks.py
+++ b/utils/benchmarks.py
@@ -28,9 +28,11 @@
 import argparse
 import sys
 import time
+import typing as t
 from pathlib import Path
 
 import pandas as pd
+import yaml
 
 FILE = Path(__file__).resolve()
 ROOT = FILE.parents[1]  # YOLOv5 root directory
@@ -45,6 +47,80 @@
 from utils.torch_utils import select_device
 
 
+class ThresholdError(Exception):
+    pass
+
+
+def get_benchmark_threshold_value(data_path: str, model_name: str) -> t.Union[float, int, None]:
+    """
+    Given the path to the data configurations and target model name,
+    retrieve the target benchmark value
+    Args:
+        data_path: The location of the data configuration file. e.g. data/coco128.yaml
+        model_name: The name of the model. E.g. yolov5s, yolov5n, etc
+
+    Returns:
+        The target threshold metric value. E.g. 50 (mAP)
+    """
+    with open(data_path) as f:
+        dataset_dict = yaml.safe_load(f)
+        if 'benchmarks' in dataset_dict and 'mAP' in dataset_dict['benchmarks']:
+            LOGGER.info(f'Attempting to find benchmark threshold for: {dataset_dict["download"]}')
+            # yolov5s, yolov5n, etc.
+            map_dict = dataset_dict['benchmarks']['mAP']
+            if model_name not in map_dict:
+                raise ValueError(f'Cannot find benchmark threshold for model: {model_name} in {data_path}')
+
+            map_benchmark_threshold = map_dict[model_name]
+
+            if not 0 <= map_benchmark_threshold <= 1:
+                raise ValueError('Please specify a mAP between 0 and 1.0')
+
+            return map_benchmark_threshold
+
+
+def get_unsupported_formats(unsupported_arguments: t.Tuple = ('edgetpu', 'tfjs', 'engine', 'coreml')) -> t.Tuple:
+    # coreml: Exception: Model prediction is only supported on macOS version 10.13 or later.
+    # engine: Requires gpu and docker container with TensorRT dependencies to run
+    # tfjs: Conflict with openvino numpy version (openvino < 1.20, tfjs >= 1.20)
+    # edgetpu: requires coral board, cloud tpu or some other external tpu
+    export_formats = export.export_formats()
+    unsupported = export_formats[export_formats['Argument'].isin(unsupported_arguments)].iloc[:, 1].values.tolist()
+    return tuple(unsupported)
+
+
+def get_benchmark_values(
+    name,  # export format name
+    f,  # file format
+    suffix,  # suffix of file format. E.g. '.pt', '.tflite', etc.
+    gpu,  # run on GPU (boolean value)
+    weights,  # weights path
+    data,  # data path
+    imgsz,  # image size: Two-tuple
+    half,  # use FP16 half-precision inference
+    batch_size,  # batch size
+    device,
+) -> t.List:
+    assert f not in get_unsupported_formats(), f'{name} not supported'
+    if device.type != 'cpu':
+        assert gpu, f'{name} inference not supported on GPU'
+
+    # Export
+    if f == '-':
+        w = weights  # PyTorch format
+    else:
+        w = export.run(weights=weights, imgsz=[imgsz], include=[f], device=device, half=half)[-1]  # all others
+    assert suffix in str(w), 'export failed'
+
+    # Validate
+    result = val.run(data, w, batch_size, imgsz, plots=False, device=device, task='benchmark', half=half)
+    metrics = result[0]  # metrics (mp, mr, map50, map, *losses(box, obj, cls))
+    speeds = result[2]  # times (preprocess, inference, postprocess)
+    mAP, t_inference = round(metrics[3], 4), round(speeds[1], 2)
+    # assert mA
+    return [name, mAP, t_inference]
+
+
 def run(
         weights=ROOT / 'yolov5s.pt',  # weights path
         imgsz=640,  # inference size (pixels)
@@ -54,32 +130,33 @@ def run(
         half=False,  # use FP16 half-precision inference
         test=False,  # test exports only
         pt_only=False,  # test PyTorch only
+        hard_fail=False,  # Raise errors if model fails to export or mAP lower than target threshold
 ):
     y, t = [], time.time()
     formats = export.export_formats()
     device = select_device(device)
+    # Grab benchmark threshold value
+    model_name = str(weights).split('/')[-1].split('.')[0]
+    map_benchmark_threshold = get_benchmark_threshold_value(str(data), model_name)
+
     for i, (name, f, suffix, gpu) in formats.iterrows():  # index, (name, file, suffix, gpu-capable)
-        try:
-            assert i != 9, 'Edge TPU not supported'
-            assert i != 10, 'TF.js not supported'
-            if device.type != 'cpu':
-                assert gpu, f'{name} inference not supported on GPU'
-
-            # Export
-            if f == '-':
-                w = weights  # PyTorch format
-            else:
-                w = export.run(weights=weights, imgsz=[imgsz], include=[f], device=device, half=half)[-1]  # all others
-            assert suffix in str(w), 'export failed'
+        if hard_fail:
+            if f in get_unsupported_formats():
+                continue
+            # skip unsupported
+            benchmarks = get_benchmark_values(name, f, suffix, gpu, weights, data, imgsz, half, batch_size, device)
+            y.append(benchmarks)
+            name, mAP, t_inference = benchmarks
+            if map_benchmark_threshold and mAP < map_benchmark_threshold:
+                raise ThresholdError(f'mAP value: {mAP} is below threshold value: {map_benchmark_threshold}')
+        else:
+            try:
+                y.append(get_benchmark_values(name, f, suffix, gpu, weights, data, imgsz, half, batch_size, device))
+            except Exception as e:
+                LOGGER.warning(f'WARNING: Benchmark failure for {name}: {e}')
+                benchmarks = [name, None, None]
+                y.append(benchmarks)  # mAP, t_inference
 
-            # Validate
-            result = val.run(data, w, batch_size, imgsz, plots=False, device=device, task='benchmark', half=half)
-            metrics = result[0]  # metrics (mp, mr, map50, map, *losses(box, obj, cls))
-            speeds = result[2]  # times (preprocess, inference, postprocess)
-            y.append([name, round(metrics[3], 4), round(speeds[1], 2)])  # mAP, t_inference
-        except Exception as e:
-            LOGGER.warning(f'WARNING: Benchmark failure for {name}: {e}')
-            y.append([name, None, None])  # mAP, t_inference
         if pt_only and i == 0:
             break  # break after PyTorch
 
@@ -102,6 +179,7 @@ def test(
         half=False,  # use FP16 half-precision inference
         test=False,  # test exports only
         pt_only=False,  # test PyTorch only
+        hard_fail=False  # Raise errors if model fails to export or mAP lower than target threshold
 ):
     y, t = [], time.time()
     formats = export.export_formats()
@@ -135,6 +213,11 @@ def parse_opt():
     parser.add_argument('--half', action='store_true', help='use FP16 half-precision inference')
     parser.add_argument('--test', action='store_true', help='test exports only')
     parser.add_argument('--pt-only', action='store_true', help='test PyTorch only')
+    parser.add_argument('--hard-fail',
+                        action='store_true',
+                        help='Use to raise errors if conditions are met. '
+                        'Also asserts that exported model mAP lies above '
+                        'user-defined thresholds.')
     opt = parser.parse_args()
     print_args(vars(opt))
     return opt

From de8b35b9b22a019c2891bfa117eb11a5fe480e1e Mon Sep 17 00:00:00 2001
From: Jay Lee <ljay189@gmail.com>
Date: Mon, 23 May 2022 18:26:32 +0900
Subject: [PATCH 08/15] Added comments for unsupported formats

---
 .github/workflows/ci-benchmarking.yml | 30 +++++++++++++--------------
 utils/benchmarks.py                   | 10 +++++++--
 2 files changed, 23 insertions(+), 17 deletions(-)

diff --git a/.github/workflows/ci-benchmarking.yml b/.github/workflows/ci-benchmarking.yml
index 849faa649c8f..78d0a43a72ba 100644
--- a/.github/workflows/ci-benchmarking.yml
+++ b/.github/workflows/ci-benchmarking.yml
@@ -31,20 +31,20 @@ jobs:
         with:
           python-version: ${{ matrix.python-version }}
 
-      # Note: This uses an internal pip API and may not always work
-      # https://github.com/actions/cache/blob/master/examples.md#multiple-oss-in-a-workflow
-      - name: Get pip cache
-        id: pip-cache
-        run: |
-          python -c "from pip._internal.locations import USER_CACHE_DIR; print('::set-output name=dir::' + USER_CACHE_DIR)"
-
-      - name: Cache pip
-        uses: actions/cache@v3
-        with:
-          path: ${{ steps.pip-cache.outputs.dir }}
-          key: ${{ runner.os }}-${{ matrix.python-version }}-pip-${{ hashFiles('requirements.txt') }}
-          restore-keys: |
-            ${{ runner.os }}-${{ matrix.python-version }}-pip-
+#      # Note: This uses an internal pip API and may not always work
+#      # https://github.com/actions/cache/blob/master/examples.md#multiple-oss-in-a-workflow
+#      - name: Get pip cache
+#        id: pip-cache
+#        run: |
+#          python -c "from pip._internal.locations import USER_CACHE_DIR; print('::set-output name=dir::' + USER_CACHE_DIR)"
+#
+#      - name: Cache pip
+#        uses: actions/cache@v3
+#        with:
+#          path: ${{ steps.pip-cache.outputs.dir }}
+#          key: ${{ runner.os }}-${{ matrix.python-version }}-pip-${{ hashFiles('requirements.txt') }}
+#          restore-keys: |
+#            ${{ runner.os }}-${{ matrix.python-version }}-pip-
 
       # Known Keras 2.7.0 issue: https://github.com/ultralytics/yolov5/pull/5486
       - name: Install dependencies
@@ -60,7 +60,7 @@ jobs:
       - name: Run benchmarking
         run: |
           weights=runs/train/exp/weights/best.pt
-          # benchmarking. Set --hard-fail to catch errors when mAP not above certain threshold
+          # benchmarking. Set --hard-fail to catch errors including when mAP not above certain threshold
           python utils/benchmarks.py --hard-fail
 
         shell: bash
diff --git a/utils/benchmarks.py b/utils/benchmarks.py
index c349df3fd71a..baebc6219111 100644
--- a/utils/benchmarks.py
+++ b/utils/benchmarks.py
@@ -60,7 +60,7 @@ def get_benchmark_threshold_value(data_path: str, model_name: str) -> t.Union[fl
         model_name: The name of the model. E.g. yolov5s, yolov5n, etc
 
     Returns:
-        The target threshold metric value. E.g. 50 (mAP)
+        The target threshold metric value. E.g. 0.5 (mAP)
     """
     with open(data_path) as f:
         dataset_dict = yaml.safe_load(f)
@@ -166,7 +166,13 @@ def run(
     notebook_init()  # print system info
     py = pd.DataFrame(y, columns=['Format', 'mAP@0.5:0.95', 'Inference time (ms)'] if map else ['Format', 'Export', ''])
     LOGGER.info(f'\nBenchmarks complete ({time.time() - t:.2f}s)')
-    LOGGER.info(str(py if map else py.iloc[:, :2]))
+    # pandas dataframe printing fails in CI with the following error
+    # ModuleNotFoundError: No module named 'pandas.io.formats.string'
+    try:
+        LOGGER.info(str(py if map else py.iloc[:, :2]))
+    except Exception:
+        pretty_formatted_list = '\n'.join(['\t'.join([str(cell) for cell in row]) for row in py.values.tolist()])
+        LOGGER.info(pretty_formatted_list)
     return py
 
 

From 987cc3dad610e40c6037c8c66c4f5a3c19c50619 Mon Sep 17 00:00:00 2001
From: jaewon <jaewon.lee@deepingsource.io>
Date: Tue, 24 May 2022 14:01:21 +0900
Subject: [PATCH 09/15] Added sanity check for unsupported formats to minimize
 bugs from typos and other human error

---
 utils/benchmarks.py | 24 +++++++++++++++++++++---
 1 file changed, 21 insertions(+), 3 deletions(-)

diff --git a/utils/benchmarks.py b/utils/benchmarks.py
index baebc6219111..0a9b94e71f2d 100644
--- a/utils/benchmarks.py
+++ b/utils/benchmarks.py
@@ -79,14 +79,28 @@ def get_benchmark_threshold_value(data_path: str, model_name: str) -> t.Union[fl
             return map_benchmark_threshold
 
 
-def get_unsupported_formats(unsupported_arguments: t.Tuple = ('edgetpu', 'tfjs', 'engine', 'coreml')) -> t.Tuple:
+def get_unsupported_formats() -> t.Tuple:
     # coreml: Exception: Model prediction is only supported on macOS version 10.13 or later.
     # engine: Requires gpu and docker container with TensorRT dependencies to run
     # tfjs: Conflict with openvino numpy version (openvino < 1.20, tfjs >= 1.20)
     # edgetpu: requires coral board, cloud tpu or some other external tpu
+    return 'edgetpu', 'tfjs', 'engine', 'coreml'
+
+
+def check_if_formats_exist(unsupported_arguments: t.Tuple):
+    """
+    Check to see if the formats actually exists under export_formats().
+    An error will be thrown if the argument type does not exist
+    Args:
+        unsupported_arguments: A tuple of unsupported export formats
+    """
     export_formats = export.export_formats()
-    unsupported = export_formats[export_formats['Argument'].isin(unsupported_arguments)].iloc[:, 1].values.tolist()
-    return tuple(unsupported)
+    valid_export_format_arguments = set(export_formats.Argument)
+    for unsupported_arg in unsupported_arguments:
+        if unsupported_arg not in valid_export_format_arguments:
+            raise ValueError(f'Argument: "{unsupported_arg}" is not a valid export format.\n'
+                             f'Valid export formats: {", ".join(valid_export_format_arguments)[: -1]}. \n'
+                             f'See export.export_formats() for more info.')
 
 
 def get_benchmark_values(
@@ -139,6 +153,10 @@ def run(
     model_name = str(weights).split('/')[-1].split('.')[0]
     map_benchmark_threshold = get_benchmark_threshold_value(str(data), model_name)
 
+    # get unsupported formats and check if they exist under exports.get_exports()
+    check_if_formats_exist(get_unsupported_formats())
+    # check
+
     for i, (name, f, suffix, gpu) in formats.iterrows():  # index, (name, file, suffix, gpu-capable)
         if hard_fail:
             if f in get_unsupported_formats():

From 2d7277ee11ebcce68d93b3112249e4c41b209e96 Mon Sep 17 00:00:00 2001
From: jaewon <jaewon.lee@deepingsource.io>
Date: Tue, 24 May 2022 14:27:44 +0900
Subject: [PATCH 10/15] Minor cleanup

---
 utils/benchmarks.py | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/utils/benchmarks.py b/utils/benchmarks.py
index 0a9b94e71f2d..84a6b32324d3 100644
--- a/utils/benchmarks.py
+++ b/utils/benchmarks.py
@@ -87,7 +87,7 @@ def get_unsupported_formats() -> t.Tuple:
     return 'edgetpu', 'tfjs', 'engine', 'coreml'
 
 
-def check_if_formats_exist(unsupported_arguments: t.Tuple):
+def check_if_formats_exist(unsupported_arguments: t.Tuple) -> None:
     """
     Check to see if the formats actually exists under export_formats().
     An error will be thrown if the argument type does not exist
@@ -131,7 +131,6 @@ def get_benchmark_values(
     metrics = result[0]  # metrics (mp, mr, map50, map, *losses(box, obj, cls))
     speeds = result[2]  # times (preprocess, inference, postprocess)
     mAP, t_inference = round(metrics[3], 4), round(speeds[1], 2)
-    # assert mA
     return [name, mAP, t_inference]
 
 
@@ -155,13 +154,12 @@ def run(
 
     # get unsupported formats and check if they exist under exports.get_exports()
     check_if_formats_exist(get_unsupported_formats())
-    # check
 
     for i, (name, f, suffix, gpu) in formats.iterrows():  # index, (name, file, suffix, gpu-capable)
         if hard_fail:
             if f in get_unsupported_formats():
                 continue
-            # skip unsupported
+            # [name, mAP, t_inference]
             benchmarks = get_benchmark_values(name, f, suffix, gpu, weights, data, imgsz, half, batch_size, device)
             y.append(benchmarks)
             name, mAP, t_inference = benchmarks
@@ -173,7 +171,7 @@ def run(
             except Exception as e:
                 LOGGER.warning(f'WARNING: Benchmark failure for {name}: {e}')
                 benchmarks = [name, None, None]
-                y.append(benchmarks)  # mAP, t_inference
+                y.append(benchmarks)
 
         if pt_only and i == 0:
             break  # break after PyTorch

From b351824afc782bc7018cc80ac60d3c5f072a5ae4 Mon Sep 17 00:00:00 2001
From: jaewon <jaewon.lee@deepingsource.io>
Date: Tue, 24 May 2022 20:39:06 +0900
Subject: [PATCH 11/15] Added more realistic arbitrary mAP values

---
 data/coco128.yaml | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/data/coco128.yaml b/data/coco128.yaml
index ebcd5b27c47c..0880b5aa79c5 100644
--- a/data/coco128.yaml
+++ b/data/coco128.yaml
@@ -31,7 +31,7 @@ download: https://ultralytics.com/assets/coco128.zip
 
 # Benchmark values
 benchmarks:
-  # metrics E.g. mAP
+  # metrics E.g. mAP 0.5 : 0.95
   mAP:
     # Img size 640
     yolov5n: 0.45
@@ -41,8 +41,8 @@ benchmarks:
     yolov5x: 0.45
 
     # Img size 1280
-    yolov5n6: 50
-    yolov5s6: 50
-    yolov5m6: 60
-    yolov5l6: 60
-    yolov5x6: 60
+    yolov5n6: 0.5
+    yolov5s6: 0.5
+    yolov5m6: 0.55
+    yolov5l6: 0.6
+    yolov5x6: 0.6

From 4f07625533ee0dc2f7cc3996bed27eef7c6b6cc0 Mon Sep 17 00:00:00 2001
From: jaewon <jaewon.lee@deepingsource.io>
Date: Wed, 25 May 2022 18:59:45 +0900
Subject: [PATCH 12/15] Added weights argument to ci-benchmarking.yml. Changed
 yolov5n mAP 0.5 : 0.95 threshold to 0.35

---
 .github/workflows/ci-benchmarking.yml | 3 +--
 data/coco128.yaml                     | 2 +-
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/ci-benchmarking.yml b/.github/workflows/ci-benchmarking.yml
index 78d0a43a72ba..082ea74bdcbf 100644
--- a/.github/workflows/ci-benchmarking.yml
+++ b/.github/workflows/ci-benchmarking.yml
@@ -59,8 +59,7 @@ jobs:
 
       - name: Run benchmarking
         run: |
-          weights=runs/train/exp/weights/best.pt
           # benchmarking. Set --hard-fail to catch errors including when mAP not above certain threshold
-          python utils/benchmarks.py --hard-fail
+          python utils/benchmarks.py --weights ${{ matrix.model }}.pt --hard-fail
 
         shell: bash
diff --git a/data/coco128.yaml b/data/coco128.yaml
index 0880b5aa79c5..3b6f06f5024d 100644
--- a/data/coco128.yaml
+++ b/data/coco128.yaml
@@ -34,7 +34,7 @@ benchmarks:
   # metrics E.g. mAP 0.5 : 0.95
   mAP:
     # Img size 640
-    yolov5n: 0.45
+    yolov5n: 0.35
     yolov5s: 0.45
     yolov5m: 0.45
     yolov5l: 0.45

From 3bc0008919f363075a884cac93f42d67139719a3 Mon Sep 17 00:00:00 2001
From: jaewon <jaewon.lee@deepingsource.io>
Date: Wed, 25 May 2022 19:07:36 +0900
Subject: [PATCH 13/15] Lowered mAP threshold to 0.32 to pass CI test

---
 data/coco128.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/data/coco128.yaml b/data/coco128.yaml
index 3b6f06f5024d..7e8b6b9d2ce6 100644
--- a/data/coco128.yaml
+++ b/data/coco128.yaml
@@ -34,7 +34,7 @@ benchmarks:
   # metrics E.g. mAP 0.5 : 0.95
   mAP:
     # Img size 640
-    yolov5n: 0.35
+    yolov5n: 0.32
     yolov5s: 0.45
     yolov5m: 0.45
     yolov5l: 0.45

From 6e3eb86ff9efb9229935de4e7d4554b964fba526 Mon Sep 17 00:00:00 2001
From: Glenn Jocher <glenn.jocher@ultralytics.com>
Date: Fri, 27 May 2022 11:53:28 +0200
Subject: [PATCH 14/15] Delete ci-benchmarking.yml

---
 .github/workflows/ci-benchmarking.yml | 65 ---------------------------
 1 file changed, 65 deletions(-)
 delete mode 100644 .github/workflows/ci-benchmarking.yml

diff --git a/.github/workflows/ci-benchmarking.yml b/.github/workflows/ci-benchmarking.yml
deleted file mode 100644
index 082ea74bdcbf..000000000000
--- a/.github/workflows/ci-benchmarking.yml
+++ /dev/null
@@ -1,65 +0,0 @@
-# YOLOv5 🚀 by Ultralytics, GPL-3.0 license
-
-name: CI Benchmarking
-
-on: # https://help.github.com/en/actions/reference/events-that-trigger-workflows
-  push:
-    branches: [ master ]
-  pull_request:
-    # The branches below must be a subset of the branches above
-    branches: [ master ]
-  schedule:
-    - cron: '0 0 * * *'  # Runs at 00:00 UTC every day
-
-jobs:
-  cpu-tests:
-
-    runs-on: ${{ matrix.os }}
-    strategy:
-      fail-fast: true
-      matrix:
-        os: [ ubuntu-latest ]
-        python-version: [ 3.9 ]
-        model: [ 'yolov5n', 'yolov5s' ]  # models to test
-
-    # Timeout: https://stackoverflow.com/a/59076067/4521646
-    timeout-minutes: 60
-    steps:
-      - uses: actions/checkout@v3
-      - name: Set up Python ${{ matrix.python-version }}
-        uses: actions/setup-python@v3
-        with:
-          python-version: ${{ matrix.python-version }}
-
-#      # Note: This uses an internal pip API and may not always work
-#      # https://github.com/actions/cache/blob/master/examples.md#multiple-oss-in-a-workflow
-#      - name: Get pip cache
-#        id: pip-cache
-#        run: |
-#          python -c "from pip._internal.locations import USER_CACHE_DIR; print('::set-output name=dir::' + USER_CACHE_DIR)"
-#
-#      - name: Cache pip
-#        uses: actions/cache@v3
-#        with:
-#          path: ${{ steps.pip-cache.outputs.dir }}
-#          key: ${{ runner.os }}-${{ matrix.python-version }}-pip-${{ hashFiles('requirements.txt') }}
-#          restore-keys: |
-#            ${{ runner.os }}-${{ matrix.python-version }}-pip-
-
-      # Known Keras 2.7.0 issue: https://github.com/ultralytics/yolov5/pull/5486
-      - name: Install dependencies
-        run: |
-          python -m pip install --upgrade pip
-          pip install -qr requirements.txt -f https://download.pytorch.org/whl/cpu/torch_stable.html \
-            onnx tensorflow-cpu  # wandb
-          python --version
-          pip --version
-          pip list
-        shell: bash
-
-      - name: Run benchmarking
-        run: |
-          # benchmarking. Set --hard-fail to catch errors including when mAP not above certain threshold
-          python utils/benchmarks.py --weights ${{ matrix.model }}.pt --hard-fail
-
-        shell: bash

From 6b1e90a26f49363746a13cf9d76083e9a45cc5a6 Mon Sep 17 00:00:00 2001
From: Glenn Jocher <glenn.jocher@ultralytics.com>
Date: Fri, 27 May 2022 11:54:22 +0200
Subject: [PATCH 15/15] Update ci-testing.yml

---
 .github/workflows/ci-testing.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/ci-testing.yml b/.github/workflows/ci-testing.yml
index 14f93455fa46..0d822585bd7b 100644
--- a/.github/workflows/ci-testing.yml
+++ b/.github/workflows/ci-testing.yml
@@ -39,7 +39,7 @@ jobs:
           pip list
       - name: Run benchmarks
         run: |
-          python utils/benchmarks.py --weights ${{ matrix.model }}.pt --img 320
+          python utils/benchmarks.py --weights ${{ matrix.model }}.pt --img 320 --hard-fail
 
   Tests:
     timeout-minutes: 60