diff --git a/.github/workflows/cpp-tests-classification.yml b/.github/workflows/cpp-tests-classification.yml
new file mode 100644
index 0000000000..6d68bf3856
--- /dev/null
+++ b/.github/workflows/cpp-tests-classification.yml
@@ -0,0 +1,97 @@
+name: CPP Tests (GGML Classification)
+
+on:
+  workflow_call: # Reusable entry point; callers may override ref, repository and workdir
+    inputs:
+      ref:
+        type: string
+        required: false
+        description: 'Git ref to checkout'
+      repository:
+        type: string
+        required: false
+        description: 'Repository to checkout'
+      workdir:
+        type: string
+        required: false
+        default: 'packages/classification-ggml'
+        description: 'Working directory'
+  workflow_dispatch: # Manual run; only workdir is configurable
+    inputs:
+      workdir:
+        type: string
+        required: false
+        default: 'packages/classification-ggml'
+        description: 'Working directory'
+
+# contents: read covers checkout; id-token: write lets the AWS setup step (role-to-assume) request an OIDC token.
+permissions: {contents: read, id-token: write}
+
+jobs:
+  test-cpp:
+    name: cpp-tests-${{ matrix.platform }}-${{ matrix.arch }}
+    runs-on: ${{ matrix.os }}
+    environment: release
+
+    strategy:
+      fail-fast: false # one platform failing does not cancel the others
+      matrix:
+        include:
+          - platform: linux
+            arch: x64
+            os: ubuntu-22.04
+          - platform: darwin
+            arch: arm64
+            os: macos-15
+          - platform: win32
+            arch: x64
+            os: windows-2022
+
+    env:
+      WORKDIR: ${{ inputs.workdir }} # directory the npm steps below run in
+
+    steps:
+      - name: Setup build host
+        uses: tetherto/qvac/.github/actions/setup-build-host@1d9b2165867d03c6edd675e402ee101a5d48a6d8
+        with:
+          arch: ${{ matrix.arch }}
+          platform: ${{ matrix.platform }}
+
+      - name: Checkout repository
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          ref: ${{ inputs.ref || github.ref }} # triggering ref unless the caller supplies one
+          repository: ${{ inputs.repository || github.repository }}
+          token: ${{ secrets.PAT_TOKEN }}
+
+      - name: Setup AWS + Windows CLI
+        uses: tetherto/qvac/.github/actions/setup-aws-prebuild@0bbdca93da303a0b1634ba14a89cec085621078d
+        with:
+          role-to-assume: ${{ secrets.AWS_OIDC_ROLE_ARN }}
+
+      - name: Setup vcpkg
+        uses: tetherto/qvac/.github/actions/setup-vcpkg@1d9b2165867d03c6edd675e402ee101a5d48a6d8
+        with:
+          arch: ${{ matrix.arch }}
+          platform: ${{ matrix.platform }}
+        env:
+          MODEL_S3_BUCKET: ${{ secrets.MODEL_S3_BUCKET }}
+
+      - name: Setup Bare tooling
+        uses: tetherto/qvac/.github/actions/setup-bare-tooling@0bbdca93da303a0b1634ba14a89cec085621078d
+
+      - name: Setup Apple Clang
+        uses: tetherto/qvac/.github/actions/setup-apple-clang@1d9b2165867d03c6edd675e402ee101a5d48a6d8
+        if: ${{ matrix.platform == 'darwin' }}
+
+      - name: Install npm dependencies
+        run: npm install --ignore-scripts
+        working-directory: ${{ env.WORKDIR }}
+
+      - name: Build C++ tests
+        run: npm run test:cpp:build
+        working-directory: ${{ env.WORKDIR }}
+
+      - name: Run C++ tests
+        run: npm run test:cpp:run
+        working-directory: ${{ env.WORKDIR }}
diff --git a/.github/workflows/integration-mobile-test-classification-ggml.yml b/.github/workflows/integration-mobile-test-classification-ggml.yml
new file mode 100644
index 0000000000..1b4362a6b0
--- /dev/null
+++ b/.github/workflows/integration-mobile-test-classification-ggml.yml
@@ -0,0 +1,1451 @@
+name: Mobile Integration Tests (GGML Classification)
+
+on:
+  workflow_dispatch: # Manual run; `package` selects the npm spec whose prebuilds are tested
+    inputs:
+      ref:
+        type: string
+        required: false
+        default: main
+        description: 'Git ref (branch/tag/SHA) to test'
+      package:
+        type: string
+        required: true
+        default: '@qvac/classification-ggml@latest'
+        description: 'Full NPM package spec to test (default: @qvac/classification-ggml@latest)'
+  workflow_call: # Reusable entry point; callers may override ref and repository
+    inputs:
+      ref:
+        type: string
+        required: false
+        description: 'Git ref to checkout'
+      repository:
+        type: string
+        required: false
+        description: 'Repository to checkout'
+
+env:
+  NODE_VERSION: 'lts/*'
+  ADDON_NAME: '@qvac/classification-ggml'
+  PREBUILD_ARTIFACT_PREFIX: 'classification-ggml-' # Prefix of the `classification-ggml-${platform}-${arch}` artifacts produced by prebuilds-classification-ggml.yml (via reusable-prebuilds.yml)
+  TEST_FRAMEWORK_REF: 'main' # qvac-test-addon-mobile branch/tag to check out
+  APP_BUNDLE_ID: 'io.tether.test.qvac' # Test app bundle ID (shared by all addons)
+  ADDON_WORKDIR: 'addon/packages/classification-ggml'
+
+jobs:
+  build-and-test:
+    name: Build ${{ matrix.platform }} and Run E2E Tests
+    runs-on: ${{ matrix.runner }}
+    environment: release
+    timeout-minutes: 120
+    continue-on-error: true # Test failures must not block PR merges
+    strategy:
+      fail-fast: false
+      matrix:
+        include:
+          - platform: Android
+            runner: ai-run-linux
+            os: ubuntu-24.04
+          - platform: iOS
+            runner: macos-14
+            os: macos-14
+    permissions:
+      id-token: write
+      contents: read
+      packages: read
+      pull-requests: write # Allow commenting on PRs
+
+    steps:
+      - name: Validate Dispatch Inputs
+        if: github.event_name == 'workflow_dispatch' && github.event.inputs.package
+        env:
+          PACKAGE_SPEC: ${{ github.event.inputs.package }} # handed over as data; inlining the expression in the script would let the input run as shell code
+        run: |
+          [[ "$PACKAGE_SPEC" =~ ^@qvac/ ]] && exit 0 # only the @qvac scope may be tested
+          echo "::error::Invalid package scope. Only @qvac/* is allowed."; exit 1
+
+      # Reclaim disk on the Ubuntu runner so the build does not hit "No space left on device"
+      - name: Free up disk space
+        if: matrix.platform == 'Android'
+        run: |
+          echo "Disk space before cleanup:"
+          df -h
+          # Delete software this job does not need. Every removal is
+          # best-effort (|| true) so that self-hosted runners are handled
+          # and a failed deletion never fails the step.
+          for unused in \
+            /usr/share/dotnet /opt/ghc \
+            /opt/hostedtoolcache/CodeQL /opt/hostedtoolcache/go \
+            /opt/hostedtoolcache/Python /opt/hostedtoolcache/Ruby \
+            /usr/local/lib/android/sdk/ndk /usr/local/share/boost /usr/share/swift
+          do
+            sudo rm -rf "$unused" || true
+          done
+          sudo docker image prune --all --force || true
+          sudo apt-get clean || true # clear the APT cache
+          echo "Disk space after cleanup:"
+          df -h
+
+      - name: Checkout addon repository
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          path: addon # ADDON_WORKDIR points inside this directory
+          fetch-depth: 0
+          repository: ${{ inputs.repository || github.repository }}
+          ref: ${{ inputs.ref || github.ref }}
+          token: ${{ secrets.PAT_TOKEN }}
+
+      - name: Checkout mobile test framework
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          path: test-framework # later steps use this as their working directory
+          fetch-depth: 0
+          repository: tetherto/qvac-test-addon-mobile
+          ref: ${{ env.TEST_FRAMEWORK_REF }}
+          token: ${{ secrets.PAT_TOKEN }}
+
+      - name: Setup Node.js
+        uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # 6.3.0
+        with:
+          node-version: ${{ env.NODE_VERSION }} # workflow-level env, set to "lts/*"
+
+      - name: Install global dependencies
+        run: |
+          echo "Installing global dependencies..."
+          npm install --global --ignore-scripts @expo/cli@latest
+
+      - name: Download Android prebuilds (from artifacts)
+        uses: actions/download-artifact@3e5f45b2cfb9172054b4087a40e8e0b5a5461e7c # 8.0.1
+        if: matrix.platform == 'Android' && !inputs.package # skipped when a package spec is supplied
+        with:
+          pattern: ${{ env.PREBUILD_ARTIFACT_PREFIX }}android-*
+          path: ${{ runner.temp }}/prebuilds-android-staging
+          merge-multiple: true
+
+      - name: Move Android prebuilds from staging
+        if: matrix.platform == 'Android' && !inputs.package
+        continue-on-error: true # best effort; the "Verify and prepare prebuilds" step fails if nothing arrived
+        shell: bash
+        run: |
+          mkdir -p ${{ env.ADDON_WORKDIR }}/prebuilds
+          cp -r ${{ runner.temp }}/prebuilds-android-staging/* ${{ env.ADDON_WORKDIR }}/prebuilds/ 2>/dev/null || true
+
+      - name: Download iOS prebuilds (from artifacts)
+        uses: actions/download-artifact@3e5f45b2cfb9172054b4087a40e8e0b5a5461e7c # 8.0.1
+        if: matrix.platform == 'iOS' && !inputs.package # skipped when a package spec is supplied
+        with:
+          pattern: ${{ env.PREBUILD_ARTIFACT_PREFIX }}ios-*
+          path: ${{ runner.temp }}/prebuilds-ios-staging
+          merge-multiple: true
+
+      - name: Move iOS prebuilds from staging
+        if: matrix.platform == 'iOS' && !inputs.package
+        continue-on-error: true # best effort; the "Verify and prepare prebuilds" step fails if nothing arrived
+        shell: bash
+        run: |
+          mkdir -p ${{ env.ADDON_WORKDIR }}/prebuilds
+          cp -r ${{ runner.temp }}/prebuilds-ios-staging/* ${{ env.ADDON_WORKDIR }}/prebuilds/ 2>/dev/null || true
+
+      - name: Download prebuilds from package
+        if: inputs.package
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        env:
+          PACKAGE_SPEC: ${{ inputs.package }} # user-supplied: exposed as data instead of being spliced into the script text
+        run: |
+          echo "📦 Downloading $PACKAGE_SPEC from npm for manual trigger..."
+          PACKAGE_NAME="$(sed -E 's/(.)@[^@]*$/\1/' <<< "$PACKAGE_SPEC")" # strip a trailing @version, never the leading scope @
+
+          if ! npm pack "$PACKAGE_SPEC" --ignore-scripts; then
+            echo "ERROR: Failed to download $PACKAGE_SPEC from npm"
+            echo "Please check that the package exists at https://www.npmjs.com/package/$PACKAGE_NAME"
+            exit 1
+          fi
+
+          # Extract the tarball (pattern matches any addon name)
+          tar -xzf *.tgz
+
+          # Validate prebuilds directory exists
+          if [ ! -d "package/prebuilds" ]; then
+            echo "ERROR: No prebuilds directory found in package"
+            echo "The downloaded package may not contain prebuilt binaries"
+            exit 1
+          fi
+
+          # Move prebuilds to expected location
+          mv package/prebuilds ./prebuilds
+
+          # Cleanup
+          rm -rf package *.tgz
+
+          echo "✅ Prebuilds downloaded from npm:"
+          ls -la prebuilds/
+
+      - name: Verify and prepare prebuilds
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        run: |
+          echo "Checking for prebuilds..."
+          echo "Current directory: $(pwd)"
+          # Stop right away when the prebuilds directory is missing or empty
+          if [ ! -d "prebuilds" ] || [ -z "$(ls -A prebuilds)" ]; then
+            echo "❌ ERROR: No prebuilds found!"
+            echo "   This workflow requires prebuilds to be available."
+            echo "   Either:"
+            echo "   1. Run this workflow after prebuild job completes"
+            echo "   2. Or commit prebuilds to the repository"
+            exit 1
+          fi
+          echo "✅ Prebuilds found from artifacts:"
+          ls -la prebuilds/
+
+          # Optional package script; its absence or failure is only reported
+          if npm run mobile:copy-prebuilds 2>/dev/null; then
+            echo "✅ Mobile prebuilds prepared"
+          else
+            echo "⚠️  mobile:copy-prebuilds script not available or failed"
+          fi
+
+      - name: Remove desktop prebuilds to save disk space # deletes prebuilds/darwin-*, win32-* and linux-*, printing disk usage before and after
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        run: |
+          echo "Removing desktop prebuilds to save disk space (keeping Android + iOS)..."
+          echo "Before cleanup:"
+          du -sh prebuilds/* 2>/dev/null || true
+
+          # Remove desktop prebuilds only (not needed for mobile tests)
+          rm -rf prebuilds/darwin-* prebuilds/win32-* prebuilds/linux-* 2>/dev/null || true
+
+          echo "After cleanup (Android + iOS only):"
+          du -sh prebuilds/* 2>/dev/null || true
+          df -h
+
+      - name: Verify test files exist
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        run: |
+          echo "Verifying addon has mobile tests..."
+
+          if [ ! -d "test/mobile" ]; then
+            echo "❌ ERROR: test/mobile directory not found!"
+            echo ""
+            echo "This workflow requires the addon to have mobile tests at:"
+            echo "  test/mobile/"
+            echo ""
+            echo "Please create this directory with your test files."
+            echo "See qvac-test-addon-mobile README for test file format."
+            exit 1
+          fi
+
+          # Check for .cjs test files (searched recursively)
+          CJS_COUNT=$(find test/mobile -name "*.cjs" -type f | wc -l)
+          if [ "$CJS_COUNT" -eq 0 ]; then
+            echo "❌ ERROR: No .cjs test files found in test/mobile!"
+            exit 1
+          fi
+
+          echo "✅ Mobile test files found:"
+          find test/mobile -name "*.cjs" -type f -exec ls -la {} + # same recursive search as the count; a top-level glob fails the step when tests live only in subdirectories
+
+          # Check if testAssets exists
+          if [ -d "test/mobile/testAssets" ]; then
+            echo ""
+            echo "✅ Test assets found:"
+            ls -lah test/mobile/testAssets/
+          else
+            echo ""
+            echo "ℹ️  No testAssets directory (this is optional)"
+          fi
+
+      - name: Install Ninja build tool # iOS only: installs ninja with Homebrew and prints its version
+        if: matrix.platform == 'iOS'
+        run: |
+          echo "📦 Installing Ninja build system..."
+          brew install ninja
+          ninja --version
+          echo "✅ Ninja installed successfully"
+
+      - name: Install addon dependencies # npm install inside the addon package, with lifecycle scripts disabled
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        run: |
+          echo "Installing addon dependencies..."
+          npm install --ignore-scripts
+
+      - name: Validate mobile tests are up-to-date # runs the addon's test:mobile:validate npm script; a non-zero exit fails the step
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        run: npm run test:mobile:validate
+
+      - name: Pack addon
+        working-directory: ${{ env.ADDON_WORKDIR }}
+        run: |
+          echo "Packing addon..."
+          if npm run build:pack 2>/dev/null; then
+            echo "✅ Addon packed using build:pack script"
+          else
+            echo "📦 Using npm pack directly..."
+            mkdir -p dist
+            npm pack --pack-destination dist --ignore-scripts
+          fi
+
+          # Either path must leave a tarball in dist/;
+          # take the first one and fail when there is none
+          tarball=$(ls dist/*.tgz | head -1)
+          if [ ! -f "$tarball" ]; then
+            echo "❌ Pack file not found in dist/"
+            exit 1
+          fi
+          tarball_size=$(du -h "$tarball" | cut -f1)
+          echo "✅ Pack file created: $tarball (Size: $tarball_size)"
+
+      - name: Setup test framework dependencies # npm install inside the test-framework checkout, with lifecycle scripts disabled
+        working-directory: test-framework
+        run: |
+          echo "Setting up mobile test framework..."
+          npm install --ignore-scripts
+          echo "✅ Test framework dependencies installed"
+
+      - name: Build test app with addon # runs the framework's build script against the addon checkout, then fails if any expected generated file is missing
+        working-directory: test-framework
+        run: |
+          echo "Building test app with addon..."
+          echo "This will:"
+          echo "  1. Install the addon package"
+          echo "  2. Extract test code from addon's test/mobile/ directory"
+          echo "  3. Auto-detect and order test files by dependencies"
+          echo "  4. Generate backend.cjs with test functions"
+          echo "  5. Generate e2e tests for each test function"
+          echo "  6. Copy testAssets if available"
+          echo "  7. Bundle the app"
+          echo ""
+
+          ADDON_PATH="${GITHUB_WORKSPACE}/${{ env.ADDON_WORKDIR }}"
+          npm run build "$ADDON_PATH" "$ADDON_PATH/test/mobile"
+
+          echo ""
+          echo "✅ Test app built successfully"
+
+          # Verify critical files were generated
+          if [ ! -f "backend/backend.cjs" ]; then
+            echo "❌ ERROR: backend/backend.cjs was not generated!"
+            exit 1
+          fi
+
+          if [ ! -f "e2e/tests/app.test.js" ]; then
+            echo "❌ ERROR: e2e/tests/app.test.js was not generated!"
+            exit 1
+          fi
+
+          if [ ! -f "backend/app.bundle" ]; then
+            echo "❌ ERROR: backend/app.bundle was not created!"
+            exit 1
+          fi
+
+          echo "✅ All required files generated successfully"
+
+          # Show what tests were extracted
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "EXTRACTED TEST FUNCTIONS:"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          if [ -f "app/testConfig.js" ]; then
+            cat app/testConfig.js
+          fi
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+
+      - name: Display build summary
+        if: always()
+        working-directory: test-framework
+        env:
+          PACKAGE_SPEC: ${{ inputs.package }} # user-supplied: read from the environment, never spliced into the script text
+        run: |
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "📊 BUILD SUMMARY"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo ""
+          echo "Platform: ${{ matrix.platform }}"
+          if [ "${{ github.event_name }}" == "workflow_dispatch" ]; then
+            echo "Package: $PACKAGE_SPEC"
+          else
+            echo "Addon: ${{ env.ADDON_NAME }} (from PR artifacts)"
+          fi
+          echo ""
+          echo "Generated Files:"
+          for generated in backend/backend.cjs backend/app.bundle app/testConfig.js app/assetManifest.js e2e/tests/app.test.js; do
+            echo "  $generated: $([ -f "$generated" ] && echo '✅' || echo '❌')"
+          done
+          echo ""
+          echo "Test Assets:"
+          if [ -d "testAssets" ]; then
+            ASSET_COUNT=$(find testAssets -type f | wc -l)
+            echo "  ✅ $ASSET_COUNT file(s) in testAssets/"
+          else
+            echo "  ℹ️  No testAssets (optional)"
+          fi
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+
+      # Android-specific steps
+      - name: Set up JDK 17
+        uses: actions/setup-java@be666c2fcd27ec809703dec50e508c2fdc7f6654 # 5.2.0
+        if: matrix.platform == 'Android'
+        with:
+          distribution: temurin
+          java-version: 17
+
+      - name: Setup Android SDK
+        uses: android-actions/setup-android@9fc6c4e9069bf8d3d10b2204b1fb8f6ef7065407 # 3.2.2
+        if: matrix.platform == 'Android'
+
+      - name: Generate Android project # runs `expo prebuild --clean` for Android inside the test framework
+        if: matrix.platform == 'Android'
+        working-directory: test-framework
+        run: |
+          echo "Generating Android project with Expo..."
+          npx expo prebuild --platform android --clean
+
+      - name: Build Android APK
+        if: matrix.platform == 'Android'
+        id: build_apk
+        working-directory: test-framework
+        run: |
+          echo "Building Android APK for Device Farm..."
+          export JAVA_HOME=$JAVA_HOME_17_X64
+
+          # Bundle JavaScript.
+          # The default step shell runs with -e, so a bare command followed by a
+          # `$?` check would abort before the message prints; test the command itself.
+          echo "Bundling JavaScript code..."
+          if ! npm run bundle; then
+            echo "❌ Bundle failed"
+            exit 1
+          fi
+
+          echo "✅ Bundle completed successfully"
+
+          # Build RELEASE APK (not debug) to ensure JS bundle is included
+          # Debug builds skip bundling by default and try to connect to Metro
+          # Release builds embed the JS bundle in the APK
+          cd android
+          echo "Building APK with Gradle (RELEASE with embedded JS bundle)..."
+          ./gradlew assembleRelease \
+            -PreactNativeArchitectures=arm64-v8a \
+            --no-daemon \
+            --no-build-cache \
+            --stacktrace
+          cd ..
+
+          # Find the APK (look for release)
+          APK_PATH=$(find android/app/build/outputs/apk -name "*.apk" | grep "release" | grep -v "unaligned" | head -1)
+
+          if [ -f "$APK_PATH" ]; then
+            # Convert to absolute path
+            APK_ABSOLUTE_PATH="${GITHUB_WORKSPACE}/test-framework/$APK_PATH"
+            SIZE=$(du -h "$APK_PATH" | cut -f1)
+            echo "✅ APK built successfully: $APK_PATH (Size: $SIZE)"
+            echo "apk_path=$APK_ABSOLUTE_PATH" >> $GITHUB_OUTPUT
+            echo "app_type=ANDROID_APP" >> $GITHUB_OUTPUT
+            echo "app_name=test-app-${{ matrix.platform }}.apk" >> $GITHUB_OUTPUT
+
+            # Clean up build intermediates to free disk space
+            echo "Cleaning up build intermediates..."
+            rm -rf android/app/build/intermediates
+            rm -rf android/.gradle
+            df -h
+          else
+            echo "❌ APK file not found"
+            echo "Searching in android/app/build/outputs/apk:"
+            find android/app/build/outputs/apk -type f 2>/dev/null || echo "Directory not found"
+            exit 1
+          fi
+
+      # iOS-specific steps
+      - name: Set up Xcode version # selects Xcode 16.1 (falling back to 16.1.0, then 16.2) and fails when none of them is installed
+        if: matrix.platform == 'iOS'
+        run: |
+          echo "Available Xcode versions:"
+          ls /Applications | grep Xcode || echo "No Xcode apps found"
+
+          echo ""
+          echo "Current Xcode (before switch):"
+          xcodebuild -version
+
+          # React Native requires Xcode >= 16.1
+          # Use Xcode 16.1 (has iOS 18.1 SDK which is stable and pre-installed)
+          if [ -d "/Applications/Xcode_16.1.app" ]; then
+            echo ""
+            echo "✅ Switching to Xcode 16.1..."
+            sudo xcode-select -s /Applications/Xcode_16.1.app
+          elif [ -d "/Applications/Xcode_16.1.0.app" ]; then
+            echo ""
+            echo "✅ Switching to Xcode 16.1.0..."
+            sudo xcode-select -s /Applications/Xcode_16.1.0.app
+          elif [ -d "/Applications/Xcode_16.2.app" ]; then
+            echo ""
+            echo "⚠️  Using Xcode 16.2 (16.1 not found)..."
+            sudo xcode-select -s /Applications/Xcode_16.2.app
+          else
+            echo ""
+            echo "❌ ERROR: No suitable Xcode version found (need >= 16.1)"
+            exit 1
+          fi
+
+          echo ""
+          echo "Current Xcode (after switch):"
+          xcodebuild -version
+
+          echo ""
+          echo "Available iOS SDKs:"
+          xcodebuild -showsdks | grep -i ios
+
+      - name: Install CocoaPods # iOS only: installs the cocoapods gem system-wide and prints its version
+        if: matrix.platform == 'iOS'
+        run: |
+          sudo gem install cocoapods
+          pod --version
+
+      - name: Create Keychain and Import Certificate # builds a temporary signing keychain, installs the provisioning profile under its UUID and exports PP_UUID for later steps
+        if: matrix.platform == 'iOS'
+        env:
+          BUILD_CERTIFICATE_BASE64: ${{ secrets.TEST_APP_APPLE_DISTRIBUTION_CERTIFICATE  }} # base64 text; decoded below into a .p12 file under $RUNNER_TEMP
+          P12_PASSWORD: ${{ secrets.APPLE_P12_PASSWORD }} # password used when importing the .p12
+          BUILD_PROVISION_PROFILE_BASE64: ${{ secrets.TEST_APP_APPLE_PROVISIONING_PROFILE  }} # base64 text; decoded below into a .mobileprovision file
+          KEYCHAIN_PASSWORD: ${{ secrets.APPLE_KEYCHAIN_PASSWORD }} # password of the keychain created by this step
+        run: |
+          CERTIFICATE_PATH=$RUNNER_TEMP/build_certificate.p12
+          PP_PATH=$RUNNER_TEMP/build_pp.mobileprovision
+          KEYCHAIN_PATH=$RUNNER_TEMP/app-signing.keychain-db
+
+          echo -n "$BUILD_CERTIFICATE_BASE64" | base64 --decode -o $CERTIFICATE_PATH
+          echo -n "$BUILD_PROVISION_PROFILE_BASE64" | base64 --decode -o $PP_PATH
+
+          security create-keychain -p "$KEYCHAIN_PASSWORD" $KEYCHAIN_PATH
+          security set-keychain-settings -lut 21600 $KEYCHAIN_PATH
+          security unlock-keychain -p "$KEYCHAIN_PASSWORD" $KEYCHAIN_PATH
+
+          security import $CERTIFICATE_PATH -P "$P12_PASSWORD" -A -t cert -f pkcs12 -k $KEYCHAIN_PATH
+          security set-key-partition-list -S apple-tool:,apple: -s -k "$KEYCHAIN_PASSWORD" $KEYCHAIN_PATH
+          security list-keychain -d user -s $KEYCHAIN_PATH
+
+          # Extract UUID first, then copy with UUID as filename
+          PP_UUID=$(/usr/libexec/PlistBuddy -c 'Print :UUID' /dev/stdin <<< $(security cms -D -i $PP_PATH))
+          echo "PP_UUID=$PP_UUID" >> $GITHUB_ENV
+          echo "Provisioning Profile UUID: $PP_UUID"
+
+          # Copy provisioning profile with UUID as filename
+          mkdir -p ~/Library/MobileDevice/Provisioning\ Profiles
+          cp $PP_PATH ~/Library/MobileDevice/Provisioning\ Profiles/$PP_UUID.mobileprovision
+
+          security find-identity -p codesigning -v
+
+      - name: Verify provisioning profile
+        if: matrix.platform == 'iOS'
+        run: |
+          echo "🔍 Verifying provisioning profile..."
+          echo "PP_UUID: $PP_UUID"
+
+          PP_FILE=~/Library/MobileDevice/Provisioning\ Profiles/$PP_UUID.mobileprovision
+          if [ ! -f "$PP_FILE" ]; then
+            echo "❌ Provisioning profile file not found at: $PP_FILE"
+            ls -la ~/Library/MobileDevice/Provisioning\ Profiles/
+            exit 1
+          fi
+
+          echo "📋 Provisioning Profile Details:"
+          security cms -D -i "$PP_FILE" > /tmp/profile.plist
+
+          PROFILE_NAME=$(/usr/libexec/PlistBuddy -c "Print :Name" /tmp/profile.plist 2>/dev/null || echo "Unknown")
+          PROFILE_BUNDLE_ID=$(/usr/libexec/PlistBuddy -c "Print :Entitlements:application-identifier" /tmp/profile.plist 2>/dev/null || echo "Unknown")
+          PROFILE_TEAM_ID=$(/usr/libexec/PlistBuddy -c "Print :Entitlements:com.apple.developer.team-identifier" /tmp/profile.plist 2>/dev/null || echo "Unknown")
+
+          # Detect profile type (Development, Ad Hoc, App Store, Enterprise). PlistBuddy's own output is discarded so HAS_DEVICES is exactly "yes" or "no"; capturing the printed device array made the comparisons below never match.
+          HAS_DEVICES=$(/usr/libexec/PlistBuddy -c "Print :ProvisionedDevices" /tmp/profile.plist >/dev/null 2>&1 && echo "yes" || echo "no")
+          PROVISIONS_ALL=$(/usr/libexec/PlistBuddy -c "Print :ProvisionsAllDevices" /tmp/profile.plist 2>/dev/null || echo "false")
+          HAS_GET_TASK_ALLOW=$(/usr/libexec/PlistBuddy -c "Print :Entitlements:get-task-allow" /tmp/profile.plist 2>/dev/null || echo "false")
+
+          if [[ "$PROVISIONS_ALL" == "true" ]]; then
+            PROFILE_TYPE="Enterprise"
+            EXPORT_METHOD="enterprise"
+          elif [[ "$HAS_DEVICES" == "yes" && "$HAS_GET_TASK_ALLOW" == "true" ]]; then
+            PROFILE_TYPE="Development"
+            EXPORT_METHOD="development"
+          elif [[ "$HAS_DEVICES" == "yes" && "$HAS_GET_TASK_ALLOW" == "false" ]]; then
+            PROFILE_TYPE="Ad Hoc"
+            EXPORT_METHOD="ad-hoc"
+          else
+            PROFILE_TYPE="App Store"
+            EXPORT_METHOD="app-store"
+          fi
+
+          echo "  Name: $PROFILE_NAME"
+          echo "  Type: $PROFILE_TYPE"
+          echo "  Export Method: $EXPORT_METHOD"
+          echo "  Application ID: $PROFILE_BUNDLE_ID"
+          echo "  Team ID: $PROFILE_TEAM_ID"
+          echo "  Expected Bundle ID: ${{ env.APP_BUNDLE_ID }}"
+
+          # Save export method for next step
+          echo "EXPORT_METHOD=$EXPORT_METHOD" >> $GITHUB_ENV
+
+          # Extract just the bundle ID part (remove team prefix)
+          BUNDLE_ID_ONLY=$(echo "$PROFILE_BUNDLE_ID" | sed 's/^[^.]*\.//')
+
+          if [[ "$BUNDLE_ID_ONLY" != "${{ env.APP_BUNDLE_ID }}" ]]; then
+            echo ""
+            echo "❌ ERROR: Provisioning profile bundle ID mismatch!"
+            echo "   Profile has: $BUNDLE_ID_ONLY"
+            echo "   Expected: ${{ env.APP_BUNDLE_ID }}"
+            echo ""
+            echo "The provisioning profile was created for a different bundle identifier."
+            echo "Please create a new provisioning profile for: ${{ env.APP_BUNDLE_ID }}"
+            exit 1
+          fi
+
+          echo "✅ Provisioning profile matches expected bundle ID"
+
+      - name: Generate iOS project # runs `expo prebuild --clean` for iOS inside the test framework
+        if: matrix.platform == 'iOS'
+        working-directory: test-framework
+        run: |
+          echo "Generating iOS project with Expo..."
+          npx expo prebuild --platform ios --clean
+
+      - name: Install iOS dependencies # runs pod install (with --repo-update) in the generated ios/ project
+        if: matrix.platform == 'iOS'
+        working-directory: test-framework/ios
+        run: |
+          echo "Installing CocoaPods dependencies..."
+          pod install --repo-update
+
+      - name: Build and Archive iOS App
+        if: matrix.platform == 'iOS'
+        id: build_ios
+        working-directory: test-framework
+        run: |
+          echo "Building iOS app for Device Farm..."
+
+          # Bundle JavaScript first.
+          # The default step shell runs with -e, so a bare command followed by a
+          # `$?` check would abort before the message prints; test the command itself.
+          echo "Bundling JavaScript code..."
+          if ! npm run bundle; then
+            echo "❌ Bundle failed"
+            exit 1
+          fi
+
+          echo "✅ Bundle completed successfully"
+
+          # Get scheme name
+          cd ios
+          SCHEME_NAME=$(xcodebuild -list | grep -A 1 "Schemes:" | grep -v "Schemes:" | head -1 | xargs)
+          echo "Detected scheme: $SCHEME_NAME"
+
+          # Debug: Check bundle identifier in project
+          echo "🔍 Checking project configuration..."
+          BUNDLE_ID=$(xcodebuild -showBuildSettings -workspace "$SCHEME_NAME.xcworkspace" -scheme "$SCHEME_NAME" -configuration Release -destination "generic/platform=iOS" 2>/dev/null | grep PRODUCT_BUNDLE_IDENTIFIER | head -1 | awk '{print $3}')
+          echo "Bundle Identifier in project: $BUNDLE_ID"
+
+          if [[ "$BUNDLE_ID" != "${{ env.APP_BUNDLE_ID }}" ]]; then
+            echo "⚠️  Warning: Bundle ID mismatch in Xcode project!"
+            echo "   Expected: ${{ env.APP_BUNDLE_ID }}"
+            echo "   Found: $BUNDLE_ID"
+          fi
+
+          # Debug: Check provisioning profile
+          echo "🔍 Provisioning profile UUID: $PP_UUID"
+          security cms -D -i ~/Library/MobileDevice/Provisioning\ Profiles/$PP_UUID.mobileprovision | grep -A 5 "application-identifier\|Name\|TeamIdentifier" | head -20 || echo "Could not read profile details"
+
+          # Archive for iOS device (scheme-derived paths are quoted so a scheme name containing spaces stays one argument)
+          xcodebuild -workspace "$SCHEME_NAME.xcworkspace" \
+            -scheme "$SCHEME_NAME" \
+            -sdk iphoneos \
+            -configuration Release \
+            -destination "generic/platform=iOS" \
+            -archivePath "$RUNNER_TEMP/$SCHEME_NAME.xcarchive" \
+            CODE_SIGN_STYLE=Manual \
+            PROVISIONING_PROFILE_SPECIFIER="$PP_UUID" \
+            CODE_SIGN_IDENTITY="Apple Distribution" \
+            DEVELOPMENT_TEAM="${{ secrets.APPLE_TEAM_ID }}" \
+            clean archive
+
+      - name: Export IPA # writes ExportOptions.plist, exports the archive and publishes the IPA path under the output key `apk_path`
+        if: matrix.platform == 'iOS'
+        id: export_ipa
+        working-directory: test-framework/ios
+        run: |
+          SCHEME_NAME=$(xcodebuild -list | grep -A 1 "Schemes:" | grep -v "Schemes:" | head -1 | xargs)
+
+          # Create export options using auto-detected export method
+          # The EXPORT_METHOD was determined in the "Verify provisioning profile" step
+          echo "📦 Using export method: $EXPORT_METHOD"
+
+          EXPORT_OPTS_PATH=$RUNNER_TEMP/ExportOptions.plist
+          cat > $EXPORT_OPTS_PATH << EOF
+          <?xml version="1.0" encoding="UTF-8"?>
+          <!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
+          <plist version="1.0">
+          <dict>
+            <key>method</key>
+            <string>$EXPORT_METHOD</string>
+            <key>teamID</key>
+            <string>${{ secrets.APPLE_TEAM_ID }}</string>
+            <key>signingStyle</key>
+            <string>manual</string>
+            <key>provisioningProfiles</key>
+            <dict>
+              <key>${{ env.APP_BUNDLE_ID }}</key>
+              <string>$PP_UUID</string>
+            </dict>
+          </dict>
+          </plist>
+          EOF
+
+          echo "📋 Export options:"
+          cat $EXPORT_OPTS_PATH
+
+          xcodebuild -exportArchive \
+            -archivePath $RUNNER_TEMP/$SCHEME_NAME.xcarchive \
+            -exportOptionsPlist $EXPORT_OPTS_PATH \
+            -exportPath $RUNNER_TEMP/build
+
+          IPA_FILE=$(find $RUNNER_TEMP/build -name "*.ipa" | head -1)
+          if [ -f "$IPA_FILE" ]; then
+            echo "✅ IPA exported: $IPA_FILE"
+            echo "apk_path=$IPA_FILE" >> $GITHUB_OUTPUT
+            echo "app_type=IOS_APP" >> $GITHUB_OUTPUT
+            echo "app_name=test-app-${{ matrix.platform }}.ipa" >> $GITHUB_OUTPUT
+          else
+            echo "❌ IPA file not found"
+            exit 1
+          fi
+
+      # Assume the IAM role named by the AWS_OIDC_ROLE_ARN secret in us-west-2.
+      # The following Device Farm steps invoke the AWS CLI and presumably rely on
+      # the credentials configured here.
+      - name: Configure AWS credentials via OIDC
+        uses: aws-actions/configure-aws-credentials@8df5847569e6427dd6c4fb1cf565c83acfa8afa7 # 6.0.0
+        with:
+          role-to-assume: ${{ secrets.AWS_OIDC_ROLE_ARN }}
+          aws-region: us-west-2
+          role-duration-seconds: 7200 # 2hrs for device farm tests
+
+      # Register the built app (APK or IPA) with Device Farm, upload the binary to
+      # the URL returned by create-upload, then poll until processing finishes.
+      # Output: app_upload_arn (consumed by the scheduling step).
+      - name: Upload App to Device Farm
+        id: upload_app
+        run: |
+          # Pick the outputs of whichever build step ran for this matrix entry.
+          if [ "${{ matrix.platform }}" == "Android" ]; then
+            APP_PATH="${{ steps.build_apk.outputs.apk_path }}"
+            APP_TYPE="${{ steps.build_apk.outputs.app_type }}"
+            APP_NAME="${{ steps.build_apk.outputs.app_name }}"
+          else
+            APP_PATH="${{ steps.export_ipa.outputs.apk_path }}"
+            APP_TYPE="${{ steps.export_ipa.outputs.app_type }}"
+            APP_NAME="${{ steps.export_ipa.outputs.app_name }}"
+          fi
+
+          echo "📤 Uploading app to AWS Device Farm..."
+          # Test the command directly instead of inspecting $? afterwards, so the
+          # error message is printed even when the shell runs with errexit.
+          if ! UPLOAD_RESPONSE=$(aws devicefarm create-upload \
+            --project-arn "${{ secrets.LLM_AWS_DEVICE_FARM_PROJECT_ARN }}" \
+            --name "$APP_NAME" \
+            --type "$APP_TYPE" \
+            --output json); then
+            echo "❌ Error creating upload in Device Farm"
+            echo "Response: $UPLOAD_RESPONSE"
+            exit 1
+          fi
+
+          # Quote the JSON so it reaches jq without word splitting or globbing.
+          APP_UPLOAD_URL=$(echo "$UPLOAD_RESPONSE" | jq -r '.upload.url')
+          APP_UPLOAD_ARN=$(echo "$UPLOAD_RESPONSE" | jq -r '.upload.arn')
+          echo "app_upload_arn=$APP_UPLOAD_ARN" >> "$GITHUB_OUTPUT"
+          echo "App upload ARN: $APP_UPLOAD_ARN"
+
+          echo "Uploading app file: $APP_PATH"
+          # --fail makes curl exit non-zero on an HTTP error status; without it a
+          # rejected upload would look successful here.
+          if ! curl --fail -T "$APP_PATH" "$APP_UPLOAD_URL"; then
+            echo "❌ Error uploading app file using curl"
+            exit 1
+          fi
+
+          # Wait for processing
+          echo "⏳ Waiting for upload to be processed..."
+          MAX_ATTEMPTS=30
+          ATTEMPT=1
+          while [ "$ATTEMPT" -le "$MAX_ATTEMPTS" ]; do
+            STATUS=$(aws devicefarm get-upload --arn "$APP_UPLOAD_ARN" --query "upload.status" --output text)
+            echo "Status (attempt $ATTEMPT/$MAX_ATTEMPTS): $STATUS"
+
+            if [ "$STATUS" = "SUCCEEDED" ]; then
+              echo "✅ App upload successful"
+              break
+            fi
+
+            if [ "$STATUS" = "FAILED" ]; then
+              echo "❌ Upload failed"
+              aws devicefarm get-upload --arn "$APP_UPLOAD_ARN"
+              exit 1
+            fi
+
+            sleep 10
+            ATTEMPT=$((ATTEMPT + 1))
+          done
+
+          # ATTEMPT only exceeds the limit when the loop ended without a break,
+          # i.e. the upload never reached SUCCEEDED. Fail instead of continuing
+          # with an unprocessed upload.
+          if [ "$ATTEMPT" -gt "$MAX_ATTEMPTS" ]; then
+            echo "❌ Timeout waiting for app upload processing"
+            exit 1
+          fi
+
+      # Sanity-check that the e2e test sources exist before they are packaged,
+      # then list the directory contents for the job log.
+      - name: Verify test package generation
+        working-directory: test-framework/e2e
+        run: |
+          echo "Verifying e2e test package..."
+
+          # Stop at the first required file that is missing.
+          for required in package.json tests/app.test.js; do
+            if [ ! -f "$required" ]; then
+              echo "❌ ERROR: e2e/$required not found!"
+              exit 1
+            fi
+          done
+
+          printf '%s\n' "✅ E2E test files verified" "" "Test package contents:"
+          ls -la
+          printf '%s\n' "" "Test files:"
+          ls -la tests/
+
+      # Build the e2e test bundle (package.json, tests/, npm tarball), upload it to
+      # Device Farm as an Appium Node test package, and wait for processing.
+      # Output: test_package_upload_arn (consumed by the scheduling step).
+      - name: Package and Upload Test Package
+        id: upload_test_package
+        working-directory: test-framework
+        run: |
+          echo "📦 Packaging e2e tests..."
+          cd e2e
+
+          # Install dependencies before packing
+          npm install --ignore-scripts
+
+          # Create tarball
+          npm pack --ignore-scripts
+
+          # Create zip with test files only (no node_modules - will be installed on Device Farm)
+          ZIP_NAME="e2e-tests-${{ matrix.platform }}.zip"
+          zip -r "$ZIP_NAME" \
+            package.json \
+            tests/ \
+            *.tgz
+
+          # Verify zip was created before anything tries to read it
+          if [ ! -f "$ZIP_NAME" ]; then
+            echo "❌ ERROR: Failed to create test package zip"
+            exit 1
+          fi
+
+          echo "📦 Package contents (excluding node_modules):"
+          unzip -l "$ZIP_NAME" | head -20
+
+          SIZE=$(du -h "$ZIP_NAME" | cut -f1)
+          echo "✅ Test package created: $ZIP_NAME (Size: $SIZE)"
+
+          mv "$ZIP_NAME" "$GITHUB_WORKSPACE/"
+
+          # Upload test package to AWS Device Farm
+          echo "📤 Uploading test package to AWS Device Farm..."
+          # Test the command directly instead of inspecting $? afterwards, so the
+          # error message is printed even when the shell runs with errexit.
+          if ! UPLOAD_RESPONSE=$(aws devicefarm create-upload \
+            --project-arn "${{ secrets.LLM_AWS_DEVICE_FARM_PROJECT_ARN }}" \
+            --name "$ZIP_NAME" \
+            --type "APPIUM_NODE_TEST_PACKAGE" \
+            --output json); then
+            echo "❌ Error creating test package upload in Device Farm"
+            echo "Response: $UPLOAD_RESPONSE"
+            exit 1
+          fi
+
+          # Quote the JSON so it reaches jq without word splitting or globbing.
+          TEST_UPLOAD_URL=$(echo "$UPLOAD_RESPONSE" | jq -r '.upload.url')
+          TEST_UPLOAD_ARN=$(echo "$UPLOAD_RESPONSE" | jq -r '.upload.arn')
+          echo "test_package_upload_arn=$TEST_UPLOAD_ARN" >> "$GITHUB_OUTPUT"
+          echo "Test package upload ARN: $TEST_UPLOAD_ARN"
+
+          echo "Uploading to: $TEST_UPLOAD_URL"
+          # --fail makes curl exit non-zero on an HTTP error status; without it a
+          # rejected upload would look successful here.
+          if ! curl --fail -T "$GITHUB_WORKSPACE/$ZIP_NAME" "$TEST_UPLOAD_URL"; then
+            echo "❌ Error uploading test package using curl"
+            exit 1
+          fi
+
+          # Wait for processing
+          echo "⏳ Waiting for test package to be processed..."
+          MAX_ATTEMPTS=30
+          ATTEMPT=1
+          while [ "$ATTEMPT" -le "$MAX_ATTEMPTS" ]; do
+            STATUS=$(aws devicefarm get-upload --arn "$TEST_UPLOAD_ARN" --query "upload.status" --output text)
+            echo "Test package status (attempt $ATTEMPT/$MAX_ATTEMPTS): $STATUS"
+
+            if [ "$STATUS" = "SUCCEEDED" ]; then
+              echo "✅ Test package upload successful"
+              break
+            fi
+
+            if [ "$STATUS" = "FAILED" ]; then
+              echo "❌ Test package upload failed"
+              aws devicefarm get-upload --arn "$TEST_UPLOAD_ARN"
+              exit 1
+            fi
+
+            sleep 10
+            ATTEMPT=$((ATTEMPT + 1))
+          done
+
+          # ATTEMPT only exceeds the limit when the loop ended without a break.
+          if [ "$ATTEMPT" -gt "$MAX_ATTEMPTS" ]; then
+            echo "❌ Timeout waiting for test package processing"
+            exit 1
+          fi
+
+      # NOTE: The steps below are unchanged from the source workflow this file was
+      # derived from. The only monorepo-related change in this file is that "addon"
+      # operations now target addon/packages/classification-ggml via env.ADDON_WORKDIR.
+
+      - name: Create and Upload Test Spec
+        id: upload_test_spec
+        run: |
+          echo "📝 Creating test spec for custom environment mode..."
+          echo "Platform: ${{ matrix.platform }}"
+          
+          # Create platform-specific test spec using printf for precise control
+          # NOTE: Both platforms use a 'before' hook in the wdio config to click the button
+          # This ensures a single Appium session for reliability (no session handoff issues)
+          # The before hook includes crash detection using queryAppState
+          if [ "${{ matrix.platform }}" == "Android" ]; then
+            PLATFORM="Android"
+            AUTOMATION="UiAutomator2"
+            HOST_LINE="android_test_host: amazon_linux_2"
+            BUNDLE_ID="${{ env.APP_BUNDLE_ID }}"
+            # Android wdio config with crash detection (bail:0 = continue on test failures, crash = process.exit)
+            # Increased timeout to 30 minutes (1800000ms) for long-running LLM tests
+            WDIO_CONFIG='exports.config={runner:"local",hostname:"127.0.0.1",port:4723,path:"/wd/hub",specs:["*.spec.js","*.test.js"],maxInstances:1,bail:0,capabilities:[{platformName:"Android","appium:automationName":"UiAutomator2","appium:appPackage":"'${{ env.APP_BUNDLE_ID }}'","appium:appActivity":"'${{ env.APP_BUNDLE_ID }}'.MainActivity","appium:newCommandTimeout":300,"appium:autoGrantPermissions":true,"appium:autoAcceptAlerts":true,"appium:noReset":true,"appium:dontStopAppOnReset":true,"appium:forceAppLaunch":false}],logLevel:"debug",waitforTimeout:120000,connectionRetryTimeout:30000,connectionRetryCount:3,services:[],framework:"mocha",reporters:["spec"],mochaOpts:{ui:"bdd",timeout:1800000},before:async function(capabilities,specs,browser){const BUNDLE_ID="'${{ env.APP_BUNDLE_ID }}'";global.appCrashed=false;global.checkAppCrash=async(stage)=>{try{const state=await browser.queryAppState(BUNDLE_ID);console.log("["+stage+"] App state: "+state+" (4=foreground,3=background,1=not running)");if(state<3){console.error("\\n🛑 APP CRASHED at "+stage+"! 
State="+state);console.error("Check device logs for BareKit/native errors.\\n");global.appCrashed=true;process.exit(1);}return state;}catch(e){console.log("["+stage+"] queryAppState error: "+e.message);return-1;}};console.log("Checking initial app state...");await global.checkAppCrash("startup");console.log("Waiting for app to initialize...");await browser.pause(5000);await global.checkAppCrash("after-pause");const initText=await browser.$("android=new UiSelector().textContains(\"INITIALIZED\")");await initText.waitForDisplayed({timeout:60000});await global.checkAppCrash("after-init");console.log("App initialized, clicking Run Automated Tests...");const button=await browser.$("android=new UiSelector().textContains(\"Run Automated Tests\")");await button.waitForDisplayed({timeout:15000});await button.click();console.log("Button clicked!");await browser.pause(5000);await global.checkAppCrash("after-click");},after:async function(result,capabilities,specs){try{const fs=require("fs");const path=require("path");const artifactDir=path.resolve(process.cwd(),"tests","artifacts");const artifactPath=path.join(artifactDir,"android-generated-images.zip");const remoteDirs=["/sdcard/Download/qvac-generated-images","/storage/emulated/0/Download/qvac-generated-images"];fs.mkdirSync(artifactDir,{recursive:true});if(typeof browser.pullFolder!=="function"){console.log("No Android generated image artifacts collected: browser.pullFolder is not available");return;}let saved=false;for(const remoteDir of remoteDirs){try{console.log("Attempting to pull generated images from "+remoteDir);const folderData=await browser.pullFolder(remoteDir);fs.writeFileSync(artifactPath,Buffer.from(folderData,"base64"));console.log("Saved generated image artifacts to "+artifactPath);saved=true;break;}catch(e){console.log("Could not pull Android generated images from "+remoteDir+": "+e.message);}}if(!saved){console.log("No Android generated image artifacts collected");}}catch(e){console.log("No Android 
generated image artifacts collected: "+e.message);}},afterTest:async function(test,context,{error}){if(global.appCrashed)return;await global.checkAppCrash("after-test:"+test.title);}};'
+          else
+            PLATFORM="iOS"
+            AUTOMATION="XCUITest"
+            # iOS 18+ requires macos_sequoia test host (supports iOS 15-26)
+            HOST_LINE="ios_test_host: macos_sequoia"
+            BUNDLE_ID="${{ env.APP_BUNDLE_ID }}"
+            # iOS wdio config with crash detection (bail:0 = continue on test failures, crash = process.exit)
+            # usePrebuiltWDA uses Device Farm's pre-built WebDriverAgent
+            # Increased timeout to 30 minutes (1800000ms) for long-running LLM tests
+            WDIO_CONFIG='exports.config={runner:"local",hostname:"127.0.0.1",port:4723,path:"/wd/hub",specs:["*.spec.js","*.test.js"],maxInstances:1,bail:0,capabilities:[{platformName:"iOS","appium:automationName":"XCUITest","appium:bundleId":"'${{ env.APP_BUNDLE_ID }}'","appium:newCommandTimeout":300,"appium:noReset":true,"appium:forceAppLaunch":false,"appium:usePrebuiltWDA":true,"appium:wdaLocalPort":8100,"appium:showIOSLog":true,"appium:realDeviceLogger":"/usr/local/lib/node_modules/appium/node_modules/deviceconsole/deviceconsole"}],logLevel:"debug",waitforTimeout:120000,connectionRetryTimeout:30000,connectionRetryCount:3,services:[],framework:"mocha",reporters:["spec"],mochaOpts:{ui:"bdd",timeout:1800000},before:async function(capabilities,specs,browser){const BUNDLE_ID="'${{ env.APP_BUNDLE_ID }}'";global.appCrashed=false;global.checkAppCrash=async(stage)=>{try{const state=await browser.queryAppState(BUNDLE_ID);console.log("["+stage+"] App state: "+state+" (4=foreground,3=background,1=not running)");if(state<3){console.error("\\n🛑 APP CRASHED at "+stage+"! 
State="+state);console.error("Check device logs for BareKit/native errors.\\n");global.appCrashed=true;process.exit(1);}return state;}catch(e){console.log("["+stage+"] queryAppState error: "+e.message);return-1;}};console.log("Checking initial app state...");await global.checkAppCrash("startup");console.log("Waiting for app to initialize...");await browser.pause(5000);await global.checkAppCrash("after-pause");const initText=await browser.$("-ios predicate string:label CONTAINS \"INITIALIZED\"");await initText.waitForDisplayed({timeout:60000});await global.checkAppCrash("after-init");console.log("App initialized, clicking Run Automated Tests...");const button=await browser.$("-ios predicate string:label CONTAINS \"Run Automated Tests\"");await button.waitForDisplayed({timeout:15000});await button.click();console.log("Button clicked!");await browser.pause(5000);await global.checkAppCrash("after-click");},after:async function(result,capabilities,specs){try{const fs=require("fs");const path=require("path");const artifactDir=path.resolve(process.cwd(),"tests","artifacts");const remoteArtifactDir="@'${{ env.APP_BUNDLE_ID }}':documents/test/generated-images/";const artifactPath=path.join(artifactDir,"ios-generated-images.zip");fs.mkdirSync(artifactDir,{recursive:true});if(typeof browser.pullFolder!=="function"){console.log("No iOS generated image artifacts collected: browser.pullFolder is not available");return;}console.log("Attempting to pull generated images from "+remoteArtifactDir);const folderData=await browser.pullFolder(remoteArtifactDir);fs.writeFileSync(artifactPath,Buffer.from(folderData,"base64"));console.log("Saved generated image artifacts to "+artifactPath);}catch(e){console.log("No iOS generated image artifacts collected: "+e.message);}},afterTest:async function(test,context,{error}){if(global.appCrashed)return;await global.checkAppCrash("after-test:"+test.title);}};'
+          fi
+          
+          # Base64 encode the wdio config to safely embed in YAML
+          # Note: macOS base64 doesn't support -w flag (no line wrapping by default)
+          WDIO_CONFIG_B64=$(echo "$WDIO_CONFIG" | base64 | tr -d '\n')
+
+          # Create test spec YAML using printf to avoid variable expansion issues.
+          # Every format string is single-quoted, so the $VARIABLES below are written
+          # literally into testspec.yml; only the %s placeholders are filled in by
+          # this script.
+          # Any single-line command containing ": " must be emitted as a "|" block:
+          # as a plain YAML scalar it would be parsed as a mapping, not a string.
+          {
+            printf 'version: 0.1\n'
+            if [ -n "$HOST_LINE" ]; then
+              printf '%s\n' "$HOST_LINE"
+            fi
+            printf '\n'
+            printf 'phases:\n'
+            printf '  install:\n'
+            printf '    commands:\n'
+            printf '      - echo "Setting up Node.js environment..."\n'
+            printf '      - export NVM_DIR=$HOME/.nvm\n'
+            printf '      - . $NVM_DIR/nvm.sh 2>/dev/null || true\n'
+            printf '      - nvm install 18 2>/dev/null || true\n'
+            printf '      - nvm use 18 2>/dev/null || true\n'
+            printf '      - node --version || echo "Using system node"\n'
+            printf '\n'
+            printf '  pre_test:\n'
+            printf '    commands:\n'
+            printf '      - echo "Setting up test environment..."\n'
+            printf '      - cd $DEVICEFARM_TEST_PACKAGE_PATH\n'
+            printf '      - ls -la\n'
+            printf '      - echo "Installing dependencies (clean install)..."\n'
+            printf '      - rm -rf node_modules package-lock.json 2>/dev/null || true\n'
+            printf '      - npm install --legacy-peer-deps 2>&1\n'
+            printf '      - echo "Verifying wdio installation..."\n'
+            printf '      - ls -la node_modules/.bin/ | grep wdio || echo "wdio not found in .bin"\n'
+            printf '      - node node_modules/@wdio/cli/bin/wdio.js --version || echo "wdio version check failed"\n'
+            printf '      - echo "Creating wdio config for Device Farm..."\n'
+            printf '      - echo "%s" | base64 -d > tests/wdio.config.devicefarm.js\n' "$WDIO_CONFIG_B64"
+            printf '      - cat tests/wdio.config.devicefarm.js\n'
+
+            # iOS-specific WebDriverAgent configuration (only for iOS platform)
+            if [ "${{ matrix.platform }}" == "iOS" ]; then
+              printf '      - echo "🔧 Configuring WebDriverAgent for iOS..."\n'
+              printf '      - export DEVICEFARM_APPIUM_WDA_DERIVED_DATA_PATH=$DEVICEFARM_APPIUM_WDA_DERIVED_DATA_PATH_V9\n'
+              # Emitted as a "|" block because the message contains ": ".
+              printf '      - |\n'
+              printf '        echo "WDA Path: $DEVICEFARM_APPIUM_WDA_DERIVED_DATA_PATH"\n'
+            fi
+
+            printf '      - echo "🚀 Starting Appium server..."\n'
+            printf '      - export APPIUM_BASE_PATH=/wd/hub\n'
+            printf '      - |\n'
+            printf '        appium --base-path=$APPIUM_BASE_PATH --log-timestamp \\\n'
+            printf '          --log-no-colors --relaxed-security --default-capabilities \\\n'
+            printf '          "{\\"appium:deviceName\\": \\"$DEVICEFARM_DEVICE_NAME\\", \\\n'
+            printf '          \\"platformName\\": \\"$DEVICEFARM_DEVICE_PLATFORM_NAME\\", \\\n'
+            printf '          \\"appium:app\\": \\"$DEVICEFARM_APP_PATH\\", \\\n'
+            printf '          \\"appium:udid\\":\\"$DEVICEFARM_DEVICE_UDID\\", \\\n'
+            printf '          \\"appium:platformVersion\\": \\"$DEVICEFARM_DEVICE_OS_VERSION\\", \\\n'
+            printf '          \\"appium:chromedriverExecutableDir\\": \\"$DEVICEFARM_CHROMEDRIVER_EXECUTABLE_DIR\\", \\\n'
+            printf '          \\"appium:wdaLocalPort\\": 8100, \\\n'
+            printf '          \\"appium:derivedDataPath\\": \\"$DEVICEFARM_APPIUM_WDA_DERIVED_DATA_PATH\\", \\\n'
+            printf '          \\"appium:usePrebuiltWDA\\": true, \\\n'
+            printf '          \\"appium:automationName\\": \\"%s\\"}" \\\n' "$AUTOMATION"
+            printf '          >> $DEVICEFARM_LOG_DIR/appium.log 2>&1 &\n'
+            printf '      - echo "⏳ Waiting for Appium to be ready (max 30 seconds)..."\n'
+            printf '      - |\n'
+            printf '        appium_initialization_time=0\n'
+            printf '        until curl --silent --fail "http://0.0.0.0:4723${APPIUM_BASE_PATH}/status"; do\n'
+            printf '          if [[ $appium_initialization_time -gt 30 ]]; then\n'
+            printf '            echo "❌ Appium did not start within 30 seconds. Exiting..."\n'
+            printf '            cat $DEVICEFARM_LOG_DIR/appium.log\n'
+            printf '            exit 1\n'
+            printf '          fi\n'
+            printf '          appium_initialization_time=$((appium_initialization_time + 1))\n'
+            printf '          echo "Waiting for Appium to start on port 4723 (${appium_initialization_time}s/30s)..."\n'
+            printf '          sleep 1\n'
+            printf '        done\n'
+            printf '      - echo "✅ Appium server is ready!"\n'
+            printf '      - curl -s http://0.0.0.0:4723${APPIUM_BASE_PATH}/status || echo "Status check failed"\n'
+            printf '      - echo "ℹ️  Button click handled via WebDriverIO before hook (single session)"\n'
+            printf '\n'
+            printf '  test:\n'
+            printf '    commands:\n'
+            printf '      - echo "🧪 Running WebDriverIO tests..."\n'
+            printf '      - cd $DEVICEFARM_TEST_PACKAGE_PATH\n'
+            printf '      - echo "Verifying Appium is still running..."\n'
+            printf '      - ps aux | grep appium | grep -v grep || echo "⚠️  Appium process not found"\n'
+            printf '      - curl -s http://127.0.0.1:4723/wd/hub/status || echo "⚠️  Appium status check failed"\n'
+
+            printf '      - echo "Starting wdio test execution..."\n'
+            printf '      - node node_modules/@wdio/cli/bin/wdio.js run tests/wdio.config.devicefarm.js\n'
+            printf '\n'
+            printf '  post_test:\n'
+            printf '    commands:\n'
+            printf '      - echo "Test completed"\n'
+            printf '      - cd $DEVICEFARM_TEST_PACKAGE_PATH\n'
+            printf '      - |\n'
+            printf '        if [ -d tests/artifacts ]; then\n'
+            printf '          mkdir -p "$DEVICEFARM_LOG_DIR/generated-images"\n'
+            printf '          if ls tests/artifacts/* >/dev/null 2>&1; then\n'
+            printf '            cp tests/artifacts/* "$DEVICEFARM_LOG_DIR/generated-images/"\n'
+            printf '            echo "Copied generated image artifacts to $DEVICEFARM_LOG_DIR/generated-images"\n'
+            printf '          else\n'
+            printf '            echo "No generated image artifacts found in tests/artifacts"\n'
+            printf '          fi\n'
+            printf '        else\n'
+            printf '          echo "No tests/artifacts directory found"\n'
+            printf '        fi\n'
+
+            # iOS-specific: Output captured device logs
+            if [ "${{ matrix.platform }}" == "iOS" ]; then
+              printf '      - echo ""\n'
+              printf '      - echo "📱 ========== iOS Device Console Logs =========="\n'
+              printf '      - |\n'
+              printf '        if [ -f "$DEVICEFARM_LOG_DIR/device_console.log" ]; then\n'
+              printf '          echo "Device console log found, showing BareKit output:"\n'
+              printf '          grep -i "bare\|console\|model\|embedding\|test\|error" "$DEVICEFARM_LOG_DIR/device_console.log" || echo "No matching logs found"\n'
+              printf '        else\n'
+              printf '          echo "No device_console.log file found"\n'
+              printf '        fi\n'
+              printf '      - echo ""\n'
+              printf '      - echo "📋 Available log files:"\n'
+              printf '      - ls -lh $DEVICEFARM_LOG_DIR/ || echo "Log directory not accessible"\n'
+            fi
+            printf '\n'
+            printf 'artifacts:\n'
+            printf '  - $DEVICEFARM_LOG_DIR\n'
+          } > testspec.yml
+          
+          # Print the generated spec for the job log, register it with Device Farm,
+          # upload it, and wait until Device Farm has processed it.
+          echo "Generated test spec:"
+          echo "===================="
+          cat testspec.yml
+          echo "===================="
+
+          echo "📤 Uploading test spec to Device Farm..."
+          # Test the command directly so a failed create-upload is reported here
+          # rather than surfacing later as a "null" URL/ARN.
+          if ! SPEC_RESPONSE=$(aws devicefarm create-upload \
+            --project-arn "${{ secrets.LLM_AWS_DEVICE_FARM_PROJECT_ARN }}" \
+            --name "testspec.yml" \
+            --type "APPIUM_NODE_TEST_SPEC" \
+            --output json); then
+            echo "❌ Error creating test spec upload in Device Farm"
+            echo "Response: $SPEC_RESPONSE"
+            exit 1
+          fi
+
+          # Quote the JSON so it reaches jq without word splitting or globbing.
+          SPEC_UPLOAD_URL=$(echo "$SPEC_RESPONSE" | jq -r '.upload.url')
+          SPEC_UPLOAD_ARN=$(echo "$SPEC_RESPONSE" | jq -r '.upload.arn')
+          echo "test_spec_arn=$SPEC_UPLOAD_ARN" >> "$GITHUB_OUTPUT"
+
+          # --fail makes curl exit non-zero on an HTTP error status; without it a
+          # rejected upload would look successful here.
+          if ! curl --fail -T testspec.yml "$SPEC_UPLOAD_URL"; then
+            echo "❌ Error uploading test spec using curl"
+            exit 1
+          fi
+
+          # Wait for processing
+          echo "⏳ Waiting for test spec to be processed..."
+          MAX_ATTEMPTS=20
+          ATTEMPT=1
+          while [ "$ATTEMPT" -le "$MAX_ATTEMPTS" ]; do
+            STATUS=$(aws devicefarm get-upload --arn "$SPEC_UPLOAD_ARN" --query "upload.status" --output text)
+            echo "Test spec status (attempt $ATTEMPT/$MAX_ATTEMPTS): $STATUS"
+
+            if [ "$STATUS" = "SUCCEEDED" ]; then
+              echo "✅ Test spec upload successful"
+              break
+            fi
+
+            if [ "$STATUS" = "FAILED" ]; then
+              echo "❌ Test spec upload failed"
+              aws devicefarm get-upload --arn "$SPEC_UPLOAD_ARN"
+              exit 1
+            fi
+
+            sleep 5
+            ATTEMPT=$((ATTEMPT + 1))
+          done
+
+          # ATTEMPT only exceeds the limit when the loop ended without a break,
+          # i.e. the spec never reached SUCCEEDED. Fail instead of scheduling a
+          # run against an unprocessed spec.
+          if [ "$ATTEMPT" -gt "$MAX_ATTEMPTS" ]; then
+            echo "❌ Timeout waiting for test spec processing"
+            exit 1
+          fi
+
+      # Schedule an APPIUM_NODE run on the platform's device pool using the app,
+      # test package and test spec uploaded by the previous steps.
+      # Output: run_arn (consumed by the monitoring step).
+      - name: Schedule Device Farm Test Run
+        id: schedule_run
+        run: |
+          if [ "${{ matrix.platform }}" == "Android" ]; then
+            POOL_ARN="${{ secrets.LLM_ANDROID_DEVICE_POOL_ARN }}"
+          else
+            POOL_ARN="${{ secrets.LLM_IOS_DEVICE_POOL_ARN }}"
+          fi
+
+          # Set run name based on trigger
+          if [ "${{ github.event_name }}" == "workflow_dispatch" ]; then
+            RUN_NAME="Manual-${{ github.run_number }}-${{ matrix.platform }}"
+          else
+            # Falls back to the run number when there is no pull request number.
+            RUN_NAME="PR-${{ github.event.pull_request.number || github.run_number }}-${{ matrix.platform }}"
+          fi
+
+          echo "🚀 Scheduling Device Farm test run..."
+          echo "Platform: ${{ matrix.platform }}"
+          echo "Device Pool ARN: $POOL_ARN"
+          echo "Run Name: $RUN_NAME"
+
+          if ! RUN_ARN=$(aws devicefarm schedule-run \
+            --project-arn "${{ secrets.LLM_AWS_DEVICE_FARM_PROJECT_ARN }}" \
+            --device-pool-arn "$POOL_ARN" \
+            --app-arn "${{ steps.upload_app.outputs.app_upload_arn }}" \
+            --name "$RUN_NAME" \
+            --test type=APPIUM_NODE,testPackageArn="${{ steps.upload_test_package.outputs.test_package_upload_arn }}",testSpecArn="${{ steps.upload_test_spec.outputs.test_spec_arn }}" \
+            --query 'run.arn' --output text); then
+            echo "❌ Error scheduling Device Farm test run"
+            exit 1
+          fi
+
+          # With --output text a missing field is printed as "None"; treat that and
+          # an empty value as a failure so later steps never poll a bogus ARN.
+          if [ -z "$RUN_ARN" ] || [ "$RUN_ARN" = "None" ]; then
+            echo "❌ Device Farm did not return a run ARN"
+            exit 1
+          fi
+
+          echo "run_arn=$RUN_ARN" >> "$GITHUB_OUTPUT"
+          echo "✅ Test run scheduled: $RUN_ARN"
+
+      # Poll the scheduled run until Device Farm reports COMPLETED (or the wait
+      # budget is exhausted), print a per-device summary with console links,
+      # publish result/counter outputs, and fail the step unless the run result is
+      # PASSED and every device job passed.
+      # Outputs: test_result, test_counters, test_total, test_passed, test_failed,
+      # test_skipped, user_test_count, user_test_passed, user_test_failed.
+      - name: Monitor Test Run
+        id: monitor_run
+        run: |
+          RUN_ARN="${{ steps.schedule_run.outputs.run_arn }}"
+          echo "📊 Monitoring test run: $RUN_ARN"
+          echo ""
+
+          MAX_WAIT_TIME=7200  # 120 minutes
+          POLL_INTERVAL=30
+          ELAPSED=0
+
+          while true; do
+            # One get-run call per poll so status and result come from the same
+            # snapshot; text output puts both fields on one whitespace-separated line.
+            RUN_STATE=$(aws devicefarm get-run --arn "$RUN_ARN" --query 'run.[status,result]' --output text)
+            read -r STATUS RESULT <<< "$RUN_STATE"
+
+            echo "⏳ Run status: $STATUS (Result: $RESULT) - Elapsed: ${ELAPSED}s"
+
+            if [[ "$STATUS" == "COMPLETED" ]]; then
+              echo ""
+              echo "✅ Test run completed!"
+              break
+            fi
+
+            if [ "$ELAPSED" -ge "$MAX_WAIT_TIME" ]; then
+              echo ""
+              echo "❌ Timeout: Test run exceeded $MAX_WAIT_TIME seconds"
+              exit 1
+            fi
+
+            sleep "$POLL_INTERVAL"
+            ELAPSED=$((ELAPSED + POLL_INTERVAL))
+          done
+
+          # Get detailed results (JSON is quoted so jq receives it unmodified)
+          RUN_DETAILS=$(aws devicefarm get-run --arn "$RUN_ARN" --output json)
+          RESULT=$(echo "$RUN_DETAILS" | jq -r '.run.result')
+          COUNTERS=$(echo "$RUN_DETAILS" | jq -r '.run.counters')
+
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "📊 FINAL TEST RESULTS"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "Result: $RESULT"
+          echo ""
+
+          # Get jobs (devices) and extract actual test names
+          echo "📱 Fetching detailed test results..."
+          JOBS=$(aws devicefarm list-jobs --arn "$RUN_ARN" --output json)
+
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "📋 YOUR TESTS (excluding Setup/Teardown)"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo ""
+
+          DEVICE_COUNT=0
+          USER_TEST_COUNT=0
+          USER_PASSED=0
+          USER_FAILED=0
+          FAILED_TEST_DETAILS=()
+
+          # Extract project ID and run ID from RUN_ARN for console links
+          # RUN_ARN format: arn:aws:devicefarm:us-west-2:ACCOUNT:run:PROJECT_ID/RUN_ID
+          PROJECT_ID=$(echo "$RUN_ARN" | sed -n 's/.*:run:\([^/]*\)\/.*/\1/p')
+          RUN_ID=$(echo "$RUN_ARN" | sed -n 's/.*:run:[^/]*\/\(.*\)/\1/p')
+
+          # Process each device/job; each job counts as one "user test".
+          for JOB_ARN in $(echo "$JOBS" | jq -r '.jobs[].arn'); do
+            DEVICE_COUNT=$((DEVICE_COUNT + 1))
+            JOB_DETAILS=$(aws devicefarm get-job --arn "$JOB_ARN" --output json)
+            DEVICE_NAME=$(echo "$JOB_DETAILS" | jq -r '.job.device.name // "Unknown Device"')
+            JOB_RESULT=$(echo "$JOB_DETAILS" | jq -r '.job.result // "UNKNOWN"')
+            JOB_ID=$(echo "$JOB_ARN" | sed -n 's/.*:job:[^/]*\/[^/]*\/\(.*\)/\1/p')
+
+            # Build console link (no region param needed when region is in subdomain)
+            CONSOLE_LINK="https://us-west-2.console.aws.amazon.com/devicefarm/home#/mobile/projects/${PROJECT_ID}/runs/${RUN_ID}/jobs/${JOB_ID}"
+
+            if [ "$JOB_RESULT" = "PASSED" ]; then
+              echo "   ✅ $DEVICE_NAME: PASSED"
+              USER_PASSED=$((USER_PASSED + 1))
+            else
+              echo "   ❌ $DEVICE_NAME: $JOB_RESULT"
+              USER_FAILED=$((USER_FAILED + 1))
+              FAILED_TEST_DETAILS+=("❌ $DEVICE_NAME: $JOB_RESULT")
+              FAILED_TEST_DETAILS+=("   📎 View logs: $CONSOLE_LINK")
+            fi
+
+            USER_TEST_COUNT=$((USER_TEST_COUNT + 1))
+            echo ""
+          done
+
+          # Show AWS Device Farm console link for the entire run
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "🔗 AWS DEVICE FARM LINKS"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo ""
+          echo "📊 Full Run Details:"
+          echo "   https://us-west-2.console.aws.amazon.com/devicefarm/home#/mobile/projects/${PROJECT_ID}/runs/${RUN_ID}"
+          echo ""
+          echo "💡 Tip: Click the link above, then select a device to view:"
+          echo "   • Video recording of the test"
+          echo "   • Screenshots"
+          echo "   • Device logs"
+          echo "   • Test spec output (shows individual test results)"
+          echo ""
+
+          # Summary
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "📊 SUMMARY"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo ""
+          echo "Devices tested: $DEVICE_COUNT"
+          echo "  ✅ Passed: $USER_PASSED"
+          echo "  ❌ Failed: $USER_FAILED"
+          echo ""
+          echo "📋 What these tests verify:"
+          echo "   The E2E tests run on Device Farm check that your app:"
+          echo "   1. Shows 'INITIALIZED' after startup"
+          echo "   2. Runs all test functions from test/mobile/*.cjs"
+          echo "   3. Reports PASS/FAIL for each test function"
+          echo ""
+          echo "💡 If a test times out but the video shows PASS:"
+          echo "   → The app test passed, but E2E gave up waiting too early"
+          echo "   → Check timeout settings in qvac-test-addon-mobile"
+          echo ""
+          echo "Device Farm Counters (includes Setup/Teardown):"
+          echo "$COUNTERS" | jq '.'
+          echo ""
+
+          if [ ${#FAILED_TEST_DETAILS[@]} -gt 0 ]; then
+            echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+            echo "❌ FAILED TESTS"
+            echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+            for failed_info in "${FAILED_TEST_DETAILS[@]}"; do
+              echo "$failed_info"
+            done
+            echo ""
+          fi
+
+          # Extract test counts
+          TOTAL=$(echo "$COUNTERS" | jq -r '.total // 0')
+          PASSED=$(echo "$COUNTERS" | jq -r '.passed // 0')
+          FAILED=$(echo "$COUNTERS" | jq -r '.failed // 0')
+          SKIPPED=$(echo "$COUNTERS" | jq -r '.skipped // 0')
+
+          # Save for PR comment. test_counters is multi-line JSON, so it uses the
+          # name<<DELIMITER form; the rest are single-line key=value pairs.
+          {
+            echo "test_result=$RESULT"
+            echo "test_counters<<EOF"
+            echo "$COUNTERS"
+            echo "EOF"
+            echo "test_total=$TOTAL"
+            echo "test_passed=$PASSED"
+            echo "test_failed=$FAILED"
+            echo "test_skipped=$SKIPPED"
+            # Also save user test counts
+            echo "user_test_count=$USER_TEST_COUNT"
+            echo "user_test_passed=$USER_PASSED"
+            echo "user_test_failed=$USER_FAILED"
+          } >> "$GITHUB_OUTPUT"
+
+          # Determine if tests passed or failed
+          # Red status (exit 1) if:
+          #   1. Device Farm overall result is not PASSED, OR
+          #   2. Any of your tests failed
+          # Green status (exit 0) only if all tests passed
+
+          if [[ "$RESULT" != "PASSED" ]] || [ "$USER_FAILED" -gt 0 ]; then
+            echo ""
+            echo "❌ Device Farm tests failed"
+            if [[ "$RESULT" != "PASSED" ]]; then
+              echo "   Device Farm result: $RESULT"
+            fi
+            echo "   Your tests: $USER_PASSED passed, $USER_FAILED failed (out of $USER_TEST_COUNT total)"
+            echo "   Device Farm total: $TOTAL | Passed: $PASSED | Failed: $FAILED | Skipped: $SKIPPED"
+            exit 1
+          fi
+
+          echo ""
+          echo "✅ All Device Farm tests passed!"
+          echo "   Your tests: $USER_PASSED passed (out of $USER_TEST_COUNT total)"
+          echo "   Device Farm total: $TOTAL | Passed: $PASSED | Failed: $FAILED | Skipped: $SKIPPED"
+
+      # Re-assume the OIDC role before fetching logs. Runs even after a failed
+      # test step, provided a Device Farm run was actually scheduled.
+      # NOTE(review): presumably needed because the earlier session can expire
+      # while the Device Farm run is in progress — confirm.
+      - name: Refresh AWS credentials for log download
+        uses: aws-actions/configure-aws-credentials@8df5847569e6427dd6c4fb1cf565c83acfa8afa7 # 6.0.0
+        if: ${{ always() && steps.schedule_run.outputs.run_arn }}
+        with:
+          aws-region: us-west-2
+          role-session-name: device-farm-logs
+          role-to-assume: ${{ secrets.AWS_OIDC_ROLE_ARN }}
+
+      # Mirrors the Device Farm artifacts of this run into
+      # devicefarm-logs/<platform> so they can be uploaded as a workflow artifact.
+      # Every AWS listing and every download is best-effort: a failed call yields
+      # an empty set / skipped file instead of failing the step.
+      - name: Download Device Farm Logs
+        if: always() && steps.schedule_run.outputs.run_arn
+        env:
+          # Passed through the environment instead of being interpolated into the
+          # script text, so the values can never be parsed as shell syntax.
+          RUN_ARN: ${{ steps.schedule_run.outputs.run_arn }}
+          PLATFORM: ${{ matrix.platform }}
+        run: |
+          LOG_DIR="devicefarm-logs/${PLATFORM}"
+          mkdir -p "$LOG_DIR"
+
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "📥 DOWNLOADING DEVICE FARM LOGS"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo ""
+          echo "Logs are downloaded so anyone with repo access can view them"
+          echo "without needing AWS Device Farm credentials."
+          if [ "$PLATFORM" = "Android" ]; then
+            echo "ℹ️  Skipping video artifacts on Android to reduce artifact size."
+          fi
+          echo ""
+
+          RUN_DETAILS=$(aws devicefarm get-run --arn "$RUN_ARN" --output json 2>/dev/null || echo '{}')
+          RUN_LABEL=$(echo "$RUN_DETAILS" | jq -r '.run.name // "unknown"')
+          echo ""
+          echo "========================================"
+          echo "📦 Run: $RUN_LABEL"
+          echo "========================================"
+
+          # SAFE_* values are file-name fragments: spaces and slashes become
+          # underscores, anything else outside [alnum_-] is dropped.
+          SAFE_RUN=$(echo "$RUN_LABEL" | tr ' /' '__' | tr -cd '[:alnum:]_-')
+          JOBS=$(aws devicefarm list-jobs --arn "$RUN_ARN" --output json 2>/dev/null || echo '{"jobs":[]}')
+
+          # One Device Farm job per device.
+          for JOB_ARN in $(echo "$JOBS" | jq -r '.jobs[].arn'); do
+            DEVICE_NAME=$(echo "$JOBS" | jq -r --arg arn "$JOB_ARN" '.jobs[] | select(.arn == $arn) | .device.name // "unknown"')
+            JOB_RESULT=$(echo "$JOBS" | jq -r --arg arn "$JOB_ARN" '.jobs[] | select(.arn == $arn) | .result // "UNKNOWN"')
+            SAFE_NAME=$(echo "$DEVICE_NAME" | tr ' /' '__' | tr -cd '[:alnum:]_-')
+
+            echo ""
+            echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+            echo "📱 $DEVICE_NAME ($JOB_RESULT)"
+            echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+
+            SUITES=$(aws devicefarm list-suites --arn "$JOB_ARN" --output json 2>/dev/null || echo '{"suites":[]}')
+
+            for SUITE_ARN in $(echo "$SUITES" | jq -r '.suites[].arn'); do
+              SUITE_NAME=$(echo "$SUITES" | jq -r --arg arn "$SUITE_ARN" '.suites[] | select(.arn == $arn) | .name // "unknown"')
+              SAFE_SUITE=$(echo "$SUITE_NAME" | tr ' /' '__' | tr -cd '[:alnum:]_-')
+
+              # Suite-level FILE artifacts (videos are skipped on Android).
+              ARTIFACTS=$(aws devicefarm list-artifacts --arn "$SUITE_ARN" --type FILE --output json 2>/dev/null || echo '{"artifacts":[]}')
+
+              echo "$ARTIFACTS" | jq -c '.artifacts[]' 2>/dev/null | while read -r ARTIFACT; do
+                ART_NAME=$(echo "$ARTIFACT" | jq -r '.name // "unknown"')
+                ART_URL=$(echo "$ARTIFACT" | jq -r '.url // empty')
+                ART_EXT=$(echo "$ARTIFACT" | jq -r '.extension // "txt"')
+                [ -z "$ART_URL" ] && continue
+
+                if [ "$PLATFORM" = "Android" ]; then
+                  if echo "$ART_NAME" | grep -qiE "^video$" || echo "$ART_EXT" | grep -qiE "^mp4$"; then
+                    echo "  Skipped (video): $SUITE_NAME / $ART_NAME"
+                    continue
+                  fi
+                fi
+
+                SAFE_ART=$(echo "$ART_NAME" | tr ' /' '__' | tr -cd '[:alnum:]_-')
+                DEST="$LOG_DIR/${SAFE_RUN}_${SAFE_NAME}_${SAFE_SUITE}_${SAFE_ART}.${ART_EXT}"
+
+                if curl -fsSL -o "$DEST" "$ART_URL" 2>/dev/null; then
+                  echo "  Downloaded: $SUITE_NAME / $ART_NAME"
+
+                  # Test-spec output is also echoed into a collapsible log group.
+                  if echo "$ART_NAME" | grep -qiE "test.spec|testspec"; then
+                    echo ""
+                    echo "::group::📋 [$DEVICE_NAME] $SUITE_NAME — $ART_NAME"
+                    cat "$DEST" 2>/dev/null || true
+                    echo "::endgroup::"
+                  fi
+                fi
+              done
+
+              # Suite-level LOG artifacts.
+              LOG_ARTIFACTS=$(aws devicefarm list-artifacts --arn "$SUITE_ARN" --type LOG --output json 2>/dev/null || echo '{"artifacts":[]}')
+
+              echo "$LOG_ARTIFACTS" | jq -c '.artifacts[]' 2>/dev/null | while read -r ARTIFACT; do
+                ART_NAME=$(echo "$ARTIFACT" | jq -r '.name // "unknown"')
+                ART_URL=$(echo "$ARTIFACT" | jq -r '.url // empty')
+                ART_EXT=$(echo "$ARTIFACT" | jq -r '.extension // "txt"')
+                [ -z "$ART_URL" ] && continue
+
+                SAFE_ART=$(echo "$ART_NAME" | tr ' /' '__' | tr -cd '[:alnum:]_-')
+                DEST="$LOG_DIR/${SAFE_RUN}_${SAFE_NAME}_${SAFE_SUITE}_${SAFE_ART}.${ART_EXT}"
+
+                if curl -fsSL -o "$DEST" "$ART_URL" 2>/dev/null; then
+                  echo "  Downloaded: $SUITE_NAME / $ART_NAME (LOG)"
+                fi
+              done
+            done
+
+            # Job-level FILE artifacts (videos are skipped on Android).
+            JOB_ARTIFACTS=$(aws devicefarm list-artifacts --arn "$JOB_ARN" --type FILE --output json 2>/dev/null || echo '{"artifacts":[]}')
+            echo "$JOB_ARTIFACTS" | jq -c '.artifacts[]' 2>/dev/null | while read -r ARTIFACT; do
+              ART_NAME=$(echo "$ARTIFACT" | jq -r '.name // "unknown"')
+              ART_URL=$(echo "$ARTIFACT" | jq -r '.url // empty')
+              ART_EXT=$(echo "$ARTIFACT" | jq -r '.extension // "txt"')
+              [ -z "$ART_URL" ] && continue
+
+              if [ "$PLATFORM" = "Android" ]; then
+                if echo "$ART_NAME" | grep -qiE "^video$" || echo "$ART_EXT" | grep -qiE "^mp4$"; then
+                  echo "  Skipped (video): job-level / $ART_NAME"
+                  continue
+                fi
+              fi
+
+              SAFE_ART=$(echo "$ART_NAME" | tr ' /' '__' | tr -cd '[:alnum:]_-')
+              DEST="$LOG_DIR/${SAFE_RUN}_${SAFE_NAME}_job_${SAFE_ART}.${ART_EXT}"
+
+              if curl -fsSL -o "$DEST" "$ART_URL" 2>/dev/null; then
+                echo "  Downloaded (job-level): $ART_NAME"
+              fi
+            done
+          done
+
+          echo ""
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          echo "📦 All downloaded logs:"
+          echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
+          # `find` exits 0 on an existing-but-empty directory, so its exit status
+          # cannot signal "nothing downloaded"; probe for a first file instead.
+          if [ -n "$(find "$LOG_DIR" -type f -print -quit 2>/dev/null)" ]; then
+            find "$LOG_DIR" -type f -exec ls -lh {} \; 2>/dev/null
+          else
+            echo "  (no logs downloaded)"
+          fi
+
+      # Publishes whatever the download step collected; an empty directory is
+      # not an error (if-no-files-found: ignore).
+      - name: Upload Device Farm Logs
+        if: always() && steps.schedule_run.outputs.run_arn
+        # Pinned to a full commit SHA like the other actions in these workflows;
+        # a mutable tag such as `v4` can be re-pointed at different code.
+        uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # 4.6.2
+        with:
+          name: devicefarm-logs-classification-ggml-${{ matrix.platform }}
+          path: devicefarm-logs/
+          retention-days: 30
+          if-no-files-found: ignore
diff --git a/.github/workflows/integration-test-classification-ggml.yml b/.github/workflows/integration-test-classification-ggml.yml
new file mode 100644
index 0000000000..43c076ea61
--- /dev/null
+++ b/.github/workflows/integration-test-classification-ggml.yml
@@ -0,0 +1,178 @@
+name: Integration Tests (GGML Classification)
+
+# Runs the package's JS integration tests on every supported desktop platform.
+# Prebuilt binaries come either from the calling run's build artifacts or,
+# when `prebuild_package` is set, from a published npm package.
+on:
+  workflow_dispatch:
+    inputs:
+      prebuild_package:
+        description: "NPM package containing prebuilds (e.g. @qvac/classification-ggml@0.1.0)"
+        required: false
+        type: string
+  workflow_call:
+    inputs:
+      ref:
+        description: "Git ref to check out (falls back to the triggering ref when empty)"
+        type: string
+        required: false
+      repository:
+        description: "Repository to check out"
+        type: string
+        required: false
+        default: "tetherto/qvac"
+      workdir:
+        description: "Working directory inside the repo (monorepo package path)"
+        type: string
+        required: false
+        default: "packages/classification-ggml"
+      prebuild_package:
+        description: "NPM package containing prebuilds (e.g. @qvac/classification-ggml@0.1.0). When set, prebuilds are downloaded from npm instead of from per-PR build artifacts."
+        type: string
+        required: false
+
+env:
+  # Honour the caller-supplied `workdir` instead of silently ignoring it.
+  # Manual dispatches declare no such input, so fall back to the package's
+  # location in the monorepo.
+  PKG_DIR: ${{ inputs.workdir || 'packages/classification-ggml' }}
+
+jobs:
+  # One job per (runner image, platform, arch) combination; a failure on one
+  # platform does not cancel the others.
+  run-integration-tests:
+    name: ${{ matrix.platform }}-${{ matrix.arch }}-integration-tests
+    runs-on: ${{ matrix.os }}
+    environment: release
+    timeout-minutes: 30
+    permissions:
+      contents: read
+      id-token: write
+      packages: read
+    strategy:
+      fail-fast: false
+      matrix:
+        include:
+          # Linux x64 is exercised on two Ubuntu releases.
+          - platform: linux
+            arch: x64
+            os: ubuntu-22.04
+          - platform: linux
+            arch: x64
+            os: ubuntu-24.04
+          - platform: linux
+            arch: arm64
+            os: ubuntu-22.04-arm
+          - platform: darwin
+            arch: arm64
+            os: macos-14
+          - platform: win32
+            arch: x64
+            os: windows-2022
+
+    steps:
+      - name: Setup Node.js
+        uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # 6.3.0
+        with:
+          node-version: lts/*
+
+      # Must run before the checkout so long paths in the repo can be created.
+      - name: Windows — enable git long paths
+        if: matrix.platform == 'win32'
+        run: git config --system core.longpaths true
+        shell: bash
+
+      # Empty `repository` / `ref` inputs fall back to the triggering
+      # repository and ref.
+      - name: Checkout code
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          token: ${{ secrets.PAT_TOKEN }}
+          repository: ${{ inputs.repository || github.repository }}
+          ref: ${{ inputs.ref || github.ref }}
+
+      - name: Setup Bare runtime
+        uses: tetherto/qvac/.github/actions/setup-bare-tooling@0bbdca93da303a0b1634ba14a89cec085621078d
+
+      # Lifecycle scripts are disabled during install.
+      - name: Install npm dependencies
+        run: npm install --ignore-scripts
+        working-directory: ${{ env.PKG_DIR }}
+
+      # Default prebuild source: artifacts of the current workflow run whose
+      # names match this platform/arch, merged into a single prebuilds/ folder.
+      # Skipped when an npm package is given instead.
+      - name: Download prebuild artifacts
+        uses: actions/download-artifact@3e5f45b2cfb9172054b4087a40e8e0b5a5461e7c # 8.0.1
+        if: ${{ !inputs.prebuild_package }}
+        with:
+          path: ${{ env.PKG_DIR }}/prebuilds
+          pattern: classification-ggml-${{ matrix.platform }}-${{ matrix.arch }}*
+          merge-multiple: true
+
+      # Alternative prebuild source: pull the published npm tarball and keep
+      # only its prebuilds/ directory.
+      - name: Download prebuilds from package (Linux/macOS)
+        if: ${{ inputs.prebuild_package && matrix.platform != 'win32' }}
+        working-directory: ${{ env.PKG_DIR }}
+        shell: bash
+        env:
+          # The input is free-form text; hand it over as an environment variable
+          # so it is never spliced into the script source.
+          PREBUILD_PACKAGE: ${{ inputs.prebuild_package }}
+        run: |
+          PACKAGE="${PREBUILD_PACKAGE}"
+          echo "Downloading $PACKAGE from npm..."
+
+          if ! npm pack "$PACKAGE" --ignore-scripts; then
+            echo "ERROR: Failed to download $PACKAGE from npm"
+            echo "Please check that the package exists"
+            exit 1
+          fi
+
+          # npm tarballs unpack into a top-level "package/" directory.
+          tar -xzf *.tgz
+
+          if [ ! -d "package/prebuilds" ]; then
+            echo "ERROR: No prebuilds directory found in package"
+            echo "The downloaded package may not contain prebuilt binaries"
+            exit 1
+          fi
+
+          mv package/prebuilds ./prebuilds
+          rm -rf package *.tgz
+
+          echo "Prebuilds downloaded from npm successfully"
+          ls -la prebuilds/
+
+      # Windows counterpart of the npm prebuild download: same flow, written
+      # for PowerShell.
+      - name: Download prebuilds from package (Windows)
+        if: ${{ inputs.prebuild_package && matrix.platform == 'win32' }}
+        working-directory: ${{ env.PKG_DIR }}
+        shell: powershell
+        env:
+          # The input is free-form text; hand it over as an environment variable
+          # so it is never spliced into the script source.
+          PREBUILD_PACKAGE: ${{ inputs.prebuild_package }}
+        run: |
+          $PACKAGE = $env:PREBUILD_PACKAGE
+          echo "Downloading $PACKAGE from npm..."
+
+          npm pack $PACKAGE --ignore-scripts
+          if ($LASTEXITCODE -ne 0) {
+            echo "ERROR: Failed to download $PACKAGE from npm"
+            echo "Please check that the package exists"
+            exit 1
+          }
+
+          $TARBALL = Get-ChildItem -Filter "*.tgz" | Select-Object -First 1 -ExpandProperty Name
+          if (-not $TARBALL) {
+            echo "ERROR: Could not find downloaded tarball"
+            exit 1
+          }
+
+          # npm tarballs unpack into a top-level "package/" directory.
+          echo "Extracting $TARBALL..."
+          tar -xzf $TARBALL
+
+          if (-not (Test-Path "package/prebuilds")) {
+            echo "ERROR: No prebuilds directory found in package"
+            echo "The downloaded package may not contain prebuilt binaries"
+            exit 1
+          }
+
+          Move-Item package/prebuilds ./prebuilds
+          Remove-Item -Recurse -Force package
+          Remove-Item $TARBALL
+
+          echo "Prebuilds downloaded from npm successfully"
+          Get-ChildItem prebuilds/
+
+      - name: Run JS integration tests
+        run: npm run test:integration
+        working-directory: ${{ env.PKG_DIR }}
+        env:
+          # Turns on the C++ per-inference trace, so the CI log carries the raw
+          # logits / probs / sorted results of every classification. Useful
+          # when chasing platform-specific numerical differences; the extra
+          # output is limited to a few lines per sample image.
+          QVAC_CLASSIFICATION_TRACE: "1"
+
+      # Uploaded even when the tests fail; a missing report is not an error.
+      - name: Upload performance report
+        uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # 4.6.2
+        if: always()
+        with:
+          name: classification-perf-report-${{ matrix.platform }}-${{ matrix.arch }}
+          path: ${{ env.PKG_DIR }}/test/results/performance-report.json
+          retention-days: 30
+          if-no-files-found: ignore
diff --git a/.github/workflows/on-merge-classification-ggml.yml b/.github/workflows/on-merge-classification-ggml.yml
new file mode 100644
index 0000000000..f43dc2d1bc
--- /dev/null
+++ b/.github/workflows/on-merge-classification-ggml.yml
@@ -0,0 +1,218 @@
+name: On Merge Trigger (Classification-ggml)
+
+on:
+  # Pushes to main and to the release-/feature-/tmp- branch families, limited
+  # to changes in the package or in one of its workflows.
+  push:
+    branches:
+      - "main"
+      - "release-*"
+      - "feature-*"
+      - "tmp-*"
+    paths:
+      - "packages/classification-ggml/**"
+      - ".github/workflows/*classification-ggml*.yml"
+  workflow_dispatch:
+    inputs:
+      tag:
+        type: choice
+        description: "Tag to publish with"
+        required: false
+        default: "dev"
+        options:
+          - latest
+          - dev
+      npm_tag:
+        type: string
+        description: "NPM dist-tag (default: latest). e.g. release-1.x"
+        required: false
+        default: ""
+
+permissions:
+  contents: read
+  id-token: write
+  packages: read
+  pull-requests: read
+
+jobs:
+  # Classifies the triggering branch into at most one publish channel and
+  # chooses the dist-tag used for GitHub Packages.
+  publish-logic:
+    runs-on: ubuntu-latest
+    outputs:
+      publish_main: ${{ steps.logic.outputs.publish_main }}
+      publish_release: ${{ steps.logic.outputs.publish_release }}
+      publish_feature: ${{ steps.logic.outputs.publish_feature }}
+      publish_tmp: ${{ steps.logic.outputs.publish_tmp }}
+      gpr_tag: ${{ steps.logic.outputs.gpr_tag }}
+    steps:
+      - id: logic
+        shell: bash
+        env:
+          INPUT_TAG: ${{ inputs.tag }}
+        run: |
+          set -euo pipefail
+
+          branch="${GITHUB_REF_NAME}"
+          trigger="${GITHUB_EVENT_NAME}"
+
+          # All channels start disabled; the branch name enables at most one.
+          publish_main="false"
+          publish_release="false"
+          publish_feature="false"
+          publish_tmp="false"
+
+          case "$trigger" in
+            push | workflow_dispatch)
+              case "$branch" in
+                main)      publish_main="true" ;;
+                release-*) publish_release="true" ;;
+                feature-*) publish_feature="true" ;;
+                tmp-*)     publish_tmp="true" ;;
+              esac
+              ;;
+          esac
+
+          # An explicit dispatch input wins; otherwise the tag follows the
+          # branch family, with "dev" for main and for anything unrecognised.
+          gpr_tag="${INPUT_TAG}"
+          if [ -z "$gpr_tag" ]; then
+            case "$branch" in
+              feature-*) gpr_tag="feature" ;;
+              tmp-*)     gpr_tag="temp" ;;
+              *)         gpr_tag="dev" ;;
+            esac
+          fi
+
+          {
+            echo "publish_main=$publish_main"
+            echo "publish_release=$publish_release"
+            echo "publish_feature=$publish_feature"
+            echo "publish_tmp=$publish_tmp"
+            echo "gpr_tag=$gpr_tag"
+          } >> "$GITHUB_OUTPUT"
+
+  # Only runs on release-* branches; the npm publish job below requires this
+  # job to succeed.
+  release-merge-guard:
+    name: Release Merge Guard
+    runs-on: ubuntu-latest
+    if: ${{ (github.event_name == 'push' || github.event_name == 'workflow_dispatch') && startsWith(github.ref_name, 'release-') }}
+    steps:
+      # Full history is fetched for the guard action.
+      - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          fetch-depth: 0
+      - uses: ./.github/actions/release-merge-guard
+        with:
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          package-slug: classification-ggml
+          package-json-path: packages/classification-ggml/package.json
+          changelog-path: packages/classification-ggml/CHANGELOG.md
+          base-ref: ${{ github.ref_name }}
+          base-sha: ${{ github.event.before }}
+          head-sha: ${{ github.sha }}
+
+  # Desktop integration tests against the exact merged commit, for any branch
+  # that maps to a publish channel.
+  run-integration-tests:
+    needs: publish-logic
+    uses: ./.github/workflows/integration-test-classification-ggml.yml
+    secrets: inherit
+    if: >-
+      needs.publish-logic.outputs.publish_main == 'true' ||
+      needs.publish-logic.outputs.publish_release == 'true' ||
+      needs.publish-logic.outputs.publish_feature == 'true' ||
+      needs.publish-logic.outputs.publish_tmp == 'true'
+    with:
+      workdir: "packages/classification-ggml"
+      repository: ${{ github.repository }}
+      ref: ${{ github.sha }}
+
+  # Mobile integration tests against the exact merged commit, under the same
+  # branch condition as the desktop tests.
+  mobile-integration-tests:
+    needs: publish-logic
+    uses: ./.github/workflows/integration-mobile-test-classification-ggml.yml
+    secrets: inherit
+    if: >-
+      needs.publish-logic.outputs.publish_main == 'true' ||
+      needs.publish-logic.outputs.publish_release == 'true' ||
+      needs.publish-logic.outputs.publish_feature == 'true' ||
+      needs.publish-logic.outputs.publish_tmp == 'true'
+    permissions:
+      contents: read
+      id-token: write
+      packages: read
+      pull-requests: write
+    with:
+      repository: ${{ github.repository }}
+      ref: ${{ github.sha }}
+
+  # GitHub Packages publish for main / feature-* / tmp-* branches. The `if`
+  # has no status function, so every job in `needs` must have succeeded.
+  publish-gpr:
+    needs: [publish-logic, run-integration-tests, mobile-integration-tests]
+    runs-on: ubuntu-latest
+    environment: release
+    if: >-
+      needs.publish-logic.outputs.publish_main == 'true' ||
+      needs.publish-logic.outputs.publish_feature == 'true' ||
+      needs.publish-logic.outputs.publish_tmp == 'true'
+    permissions:
+      contents: write
+      packages: write
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          fetch-depth: 0
+
+      - name: Publish to GitHub Packages
+        uses: ./.github/actions/publish-library-to-gpr
+        with:
+          workdir: "packages/classification-ggml"
+          name-suffix: "-mono"
+          tag: ${{ needs.publish-logic.outputs.gpr_tag }}
+          secret-token: ${{ secrets.GITHUB_TOKEN }}
+          npm-token: ${{ secrets.NPM_TOKEN }}
+
+  # npm publish for release-* branches, gated on the release merge guard.
+  # NOTE(review): because the condition starts with `!cancelled()`, the implicit
+  # success() check on `needs` is dropped. This job therefore waits for both
+  # integration-test jobs but does NOT require them to pass. Confirm that is
+  # intended; otherwise add `needs.<job>.result == 'success'` for each.
+  publish-release-npm:
+    needs: [publish-logic, release-merge-guard, run-integration-tests, mobile-integration-tests]
+    if: |
+      !cancelled() &&
+      needs.publish-logic.outputs.publish_release == 'true' &&
+      needs.release-merge-guard.result == 'success'
+    runs-on: ubuntu-latest
+    environment: release
+    outputs:
+      published_version: ${{ steps.publish.outputs.npm_published_version }}
+    permissions:
+      contents: write
+      packages: write
+      id-token: write
+    steps:
+      - name: Validate npm_tag input
+        if: inputs.npm_tag != ''
+        shell: bash
+        env:
+          # The value being validated must not be interpolated into the script
+          # that validates it; read it from the environment instead.
+          NPM_TAG: ${{ inputs.npm_tag }}
+        run: |
+          tag="${NPM_TAG}"
+          # Bash's =~ anchors ^/$ to the whole string, so a multi-line value
+          # cannot pass by having just one conforming line.
+          pattern='^[a-zA-Z0-9][a-zA-Z0-9._-]*$'
+          if [[ ! "$tag" =~ $pattern ]]; then
+            echo "::error::Invalid npm dist-tag '$tag'. Must match ^[a-zA-Z0-9][a-zA-Z0-9._-]*$ (e.g. release-1.x)"
+            exit 1
+          fi
+
+      - name: Checkout repository
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+
+      # Falls back to the "latest" dist-tag when no npm_tag was supplied.
+      - name: Publish to NPM Package Registry
+        id: publish
+        uses: ./.github/actions/publish-library-to-npm
+        with:
+          tag: ${{ inputs.npm_tag || 'latest' }}
+          workdir: "packages/classification-ggml"
+
+  # Creates the GitHub release, but only when the npm publish succeeded and
+  # reported a version.
+  publish-release:
+    needs: [publish-release-npm]
+    uses: ./.github/workflows/create-github-release.yml
+    permissions:
+      contents: write
+    if: >-
+      !cancelled() &&
+      needs.publish-release-npm.result == 'success' &&
+      needs.publish-release-npm.outputs.published_version != ''
+    with:
+      workdir: "packages/classification-ggml"
+      repo_name: "classification-ggml"
+      release_name: "QVAC GGML Image Classification Lib"
+      published_version: ${{ needs.publish-release-npm.outputs.published_version }}
+      prev_sha: ${{ github.event.before }}
diff --git a/.github/workflows/on-pr-classification-ggml.yml b/.github/workflows/on-pr-classification-ggml.yml
new file mode 100644
index 0000000000..49a3df1821
--- /dev/null
+++ b/.github/workflows/on-pr-classification-ggml.yml
@@ -0,0 +1,192 @@
+name: On PR Trigger (Classification-ggml)
+
+on:
+  # pull_request_target: the workflow definition comes from the base branch.
+  # Jobs that use the PR's code are gated on the `authorize` job below.
+  pull_request_target:
+    types: [opened, synchronize, reopened, labeled]
+    branches:
+      - "main"
+      - "release-*"
+      - "feature-*"
+      - "tmp-*"
+    paths:
+      - "packages/classification-ggml/**"
+      - ".github/workflows/*classification-ggml*.yml"
+  workflow_dispatch:
+
+permissions:
+  contents: read
+  id-token: write
+  packages: read
+  pull-requests: read
+
+env:
+  PKG_DIR: packages/classification-ggml
+
+jobs:
+  # Gate job: its `allowed` output decides whether the jobs that use the PR's
+  # code may run. No `ref` is passed to checkout, so the authorize action is
+  # loaded from the workflow's own ref rather than from the PR head.
+  authorize:
+    runs-on: ubuntu-latest
+    outputs:
+      allowed: ${{ steps.auth.outputs.allowed }}
+    permissions:
+      contents: read
+      pull-requests: write
+    steps:
+      - name: Checkout
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+      - name: Authorize
+        id: auth
+        uses: ./.github/actions/authorize-pr
+        with:
+          github-token: ${{ github.token }}
+
+  # Path filter for PR events; it does not run on manual dispatches, where
+  # the downstream jobs key off the event name instead.
+  changes:
+    runs-on: ubuntu-latest
+    if: ${{ github.event_name != 'workflow_dispatch' }}
+    outputs:
+      pkg: ${{ steps.filter.outputs.pkg }}
+    steps:
+      - id: filter
+        uses: dorny/paths-filter@fbd0ab8f3e69293af611ebaee6363fc25e6d187d # 4.0.1
+        with:
+          token: ${{ secrets.GITHUB_TOKEN }}
+          filters: |
+            pkg:
+              - "packages/classification-ggml/**"
+              - ".github/workflows/*classification-ggml*.yml"
+
+  # Runs for authorized PRs that touch the package, and for every manual
+  # dispatch. `always()` keeps it eligible when `changes` was skipped.
+  sanity-checks:
+    needs: [authorize, changes]
+    runs-on: ubuntu-latest
+    if: ${{ always() && ((needs.changes.outputs.pkg == 'true' && needs.authorize.outputs.allowed == 'true') || github.event_name == 'workflow_dispatch') }}
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          fetch-depth: 0
+
+      - name: Run Sanity checks
+        uses: ./.github/actions/sanity-checks
+        with:
+          workdir: packages/classification-ggml
+          run-integration: ${{ needs.authorize.outputs.allowed == 'true' }}
+          secret-token: ${{ secrets.GITHUB_TOKEN }}
+          pat-token: ${{ secrets.PAT_TOKEN }}
+
+  # Type-declaration check for the package, run against the PR's own code.
+  ts-checks:
+    needs: [authorize, changes, sanity-checks]
+    if: always() && needs.authorize.outputs.allowed == 'true' && (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch')
+    runs-on: ubuntu-latest
+    # This job executes code from the PR head, so it only gets read access to
+    # the repository contents.
+    permissions:
+      contents: read
+    defaults:
+      run:
+        working-directory: ${{ env.PKG_DIR }}
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # 6.0.2
+        with:
+          # Under pull_request_target the default checkout is the base branch,
+          # which would type-check code that is not part of the PR. Check out
+          # the PR head instead; manual dispatches fall back to the
+          # dispatched repository and commit.
+          repository: ${{ github.event.pull_request.head.repo.full_name || github.repository }}
+          ref: ${{ github.event.pull_request.head.sha || github.sha }}
+          # No later step needs git credentials.
+          persist-credentials: false
+      - name: Set up Node.js
+        uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # 6.3.0
+        with:
+          node-version: 20
+      - name: Install dependencies
+        run: npm install --ignore-scripts
+      - name: Type declaration check
+        run: npm run test:dts
+
+  # C++ lint over the range from the PR base (or previous push) to the PR head.
+  cpp-lint:
+    needs: [authorize, changes, sanity-checks]
+    uses: ./.github/workflows/cpp-lint.yaml
+    secrets: inherit
+    if: >-
+      always() &&
+      needs.authorize.outputs.allowed == 'true' &&
+      (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch')
+    with:
+      workdir: packages/classification-ggml
+      sha: ${{ github.event.pull_request.base.sha || github.event.before || 'HEAD~1' }}
+      pr_head_sha: ${{ github.event.pull_request.head.sha || github.sha }}
+
+  # C++ unit tests against the PR head repository and branch.
+  cpp-tests:
+    needs: [authorize, changes, sanity-checks]
+    uses: ./.github/workflows/cpp-tests-classification.yml
+    secrets: inherit
+    if: >-
+      always() &&
+      needs.authorize.outputs.allowed == 'true' &&
+      (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch')
+    with:
+      repository: ${{ github.event.pull_request.head.repo.full_name }}
+      ref: ${{ github.event.pull_request.head.ref }}
+      workdir: packages/classification-ggml
+
+  # Builds the native prebuilds from the PR head; the integration-test jobs
+  # wait for this job.
+  prebuild:
+    needs: [authorize, changes, sanity-checks]
+    uses: ./.github/workflows/prebuilds-classification-ggml.yml
+    secrets: inherit
+    if: >-
+      always() &&
+      needs.authorize.outputs.allowed == 'true' &&
+      (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch')
+    permissions:
+      contents: write
+      id-token: write
+      packages: write
+      pull-requests: write
+    with:
+      repository: ${{ github.event.pull_request.head.repo.full_name }}
+      ref: ${{ github.event.pull_request.head.ref }}
+
+  # Desktop integration tests for the PR head, started once `prebuild` has
+  # finished.
+  run-integration-tests:
+    needs: [authorize, changes, sanity-checks, prebuild]
+    uses: ./.github/workflows/integration-test-classification-ggml.yml
+    secrets: inherit
+    if: >-
+      always() &&
+      needs.authorize.outputs.allowed == 'true' &&
+      (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch')
+    permissions:
+      contents: read
+      id-token: write
+      packages: read
+    with:
+      repository: ${{ github.event.pull_request.head.repo.full_name }}
+      ref: ${{ github.event.pull_request.head.ref }}
+
+  # Mobile integration tests for the PR head, started once `prebuild` has
+  # finished.
+  run-mobile-integration-tests:
+    needs: [authorize, changes, sanity-checks, prebuild]
+    uses: ./.github/workflows/integration-mobile-test-classification-ggml.yml
+    secrets: inherit
+    if: >-
+      always() &&
+      needs.authorize.outputs.allowed == 'true' &&
+      (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch')
+    permissions:
+      contents: read
+      id-token: write
+      packages: read
+      pull-requests: write # Allow commenting on PRs
+    with:
+      repository: ${{ github.event.pull_request.head.repo.full_name }}
+      ref: ${{ github.event.pull_request.head.ref }}
+
+  # Collapses the results of all upstream jobs into three status flags for
+  # the shared public-pr workflow. Integration tests count as passing when
+  # they either succeeded or were skipped.
+  merge-guard:
+    needs:
+      - authorize
+      - changes
+      - sanity-checks
+      - ts-checks
+      - cpp-lint
+      - cpp-tests
+      - prebuild
+      - run-integration-tests
+      - run-mobile-integration-tests
+    uses: ./.github/workflows/public-pr.yml
+    if: ${{ always() && (needs.changes.outputs.pkg == 'true' || github.event_name == 'workflow_dispatch') }}
+    with:
+      build-status: ${{ needs.prebuild.result == 'success' }}
+      sanity-checks-status: ${{ needs.sanity-checks.result == 'success' && needs.ts-checks.result == 'success' && needs.cpp-lint.result == 'success' && needs.cpp-tests.result == 'success' }}
+      integration-tests-status: ${{ (needs.run-integration-tests.result == 'success' || needs.run-integration-tests.result == 'skipped') && (needs.run-mobile-integration-tests.result == 'success' || needs.run-mobile-integration-tests.result == 'skipped') }}
diff --git a/.github/workflows/on-pr-close-classification-ggml.yml b/.github/workflows/on-pr-close-classification-ggml.yml
new file mode 100644
index 0000000000..f2569f568c
--- /dev/null
+++ b/.github/workflows/on-pr-close-classification-ggml.yml
@@ -0,0 +1,66 @@
+name: On PR Close (Classification-ggml)
+
+# Triggered when a PR touching the package is closed, or manually with
+# explicit targeting inputs.
+on:
+  pull_request:
+    types: [closed]
+    paths:
+      - "packages/classification-ggml/**"
+      - ".github/workflows/*classification-ggml*.yml"
+  workflow_dispatch:
+    inputs:
+      version:
+        type: string
+        description: "Specific version to target for deletion"
+        required: false
+      pr-number:
+        type: string
+        description: "PR number to target for deletion"
+        required: false
+      pattern:
+        type: string
+        description: "Pattern to target for deletion"
+        required: false
+      packages:
+        type: string
+        description: "Packages to target for deletion, space separated"
+        required: false
+        default: "classification-ggml"
+      dry-run:
+        type: boolean
+        description: "Is dry run? If true, lists versions without deleting."
+        default: true
+
+# Shows the effective targeting values in the run title.
+run-name: >-
+  Delete NPM Versions (classification-ggml)
+  v=${{ inputs.version }}
+  pr=${{ github.event_name == 'pull_request' && github.event.pull_request.number || inputs.pr-number }}
+  dry=${{ github.event_name == 'pull_request' && true || inputs.dry-run }}
+
+permissions:
+  contents: read
+
+jobs:
+  # Debug aid: dumps the inputs and github contexts to the log. A failure
+  # here does not fail the workflow run (continue-on-error).
+  print-context:
+    runs-on: ubuntu-latest
+    continue-on-error: true
+    steps:
+      - env:
+          INPUTS_CONTEXT: ${{ toJSON(inputs) }}
+        run: |
+          echo "Inputs Context: $INPUTS_CONTEXT"
+      - env:
+          GITHUB_CONTEXT: ${{ toJSON(github) }}
+        run: |
+          echo "GitHub Context: $GITHUB_CONTEXT"
+
+  # Delegates to the shared deletion workflow. On PR close the PR number
+  # comes from the event; on manual dispatch every value comes from inputs.
+  # NOTE(review): on pull_request events `dry-run` always evaluates to true,
+  # so closing a PR only lists versions and never deletes them — confirm
+  # that this is intended.
+  delete-npm-versions-trigger:
+    uses: ./.github/workflows/public-delete-npm-versions.yml
+    permissions:
+      packages: write
+    with:
+      packages: ${{ inputs.packages || 'classification-ggml' }}
+      version: ${{ inputs.version }}
+      pattern: ${{ inputs.pattern }}
+      pr-number: ${{ github.event_name == 'pull_request' && github.event.pull_request.number || inputs.pr-number }}
+      dry-run: ${{ github.event_name == 'pull_request' && true || inputs.dry-run }}
diff --git a/.github/workflows/prebuilds-classification-ggml.yml b/.github/workflows/prebuilds-classification-ggml.yml
new file mode 100644
index 0000000000..d5d304e70b
--- /dev/null
+++ b/.github/workflows/prebuilds-classification-ggml.yml
@@ -0,0 +1,44 @@
+# Build-only workflow. Publishing lives in on-merge-classification-ggml.yml.
+name: Prebuilds (GGML Classification)
+
+on:
+  workflow_dispatch:  # Manual run; only the working directory can be overridden.
+    inputs:
+      workdir:
+        description: "Working directory (optional)"
+        required: false
+        type: string
+        default: "packages/classification-ggml"
+  workflow_call:  # Entry point for other workflows; every input is forwarded to reusable-prebuilds.yml.
+    inputs:
+      ref:
+        description: "Git ref forwarded to reusable-prebuilds.yml (optional)"
+        type: string
+        required: false
+      repository:
+        description: "Repository forwarded to reusable-prebuilds.yml (optional)"
+        type: string
+        required: false
+        default: "tetherto/qvac"
+      workdir:
+        description: "Working directory (optional)"
+        required: false
+        type: string
+        default: "packages/classification-ggml"
+
+permissions:  # Workflow-wide default for GITHUB_TOKEN: read-only repository contents.
+  contents: read
+
+jobs:
+  prebuild:  # The whole build is delegated to the reusable prebuild workflow.
+    uses: ./.github/workflows/reusable-prebuilds.yml
+    secrets: inherit
+    permissions:  # Job-level block; takes the place of the workflow-level default for this job.
+      id-token: write
+      contents: write
+      pull-requests: write
+    with:
+      artifact-name-prefix: classification-ggml-
+      repository: ${{ inputs.repository }}
+      ref: ${{ inputs.ref }}
+      workdir: ${{ inputs.workdir }}
diff --git a/packages/classification-ggml/.gitignore b/packages/classification-ggml/.gitignore
new file mode 100644
index 0000000000..1a1004453c
--- /dev/null
+++ b/packages/classification-ggml/.gitignore
@@ -0,0 +1,26 @@
+node_modules/
+package-lock.json
+build/
+prebuilds/
+dist/
+vcpkg_installed/
+.vcpkg/
+vcpkg/buildtrees/
+vcpkg/downloads/
+vcpkg/packages/
+vcpkg/installed/
+compile_commands.json
+.clang-format
+.clang-tidy
+.valgrind.supp
+*.log
+
+# Auto-generated performance report from local test runs (CI uploads its own).
+test/results/
+
+# Internal validation set (confidential, must never be committed).
+test/images/internal/
+proposal/dataset_val/
+
+# Device Farm logs downloaded for local diagnostic; never committed.
+remote_logs/
diff --git a/packages/classification-ggml/CHANGELOG.md b/packages/classification-ggml/CHANGELOG.md
new file mode 100644
index 0000000000..f243c3fb73
--- /dev/null
+++ b/packages/classification-ggml/CHANGELOG.md
@@ -0,0 +1,52 @@
+# Changelog
+
+All notable changes to `@qvac/classification-ggml` will be documented in
+this file.
+
+The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
+and this project adheres to
+[Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+
+## [0.1.0] — Unreleased
+
+### Added
+
+- Initial release of the GGML image classification addon.
+- `ImageClassifier` public API (`load`, `classify`, `unload`) orchestrated
+  via `@qvac/infer-base`'s `createJobHandler` + `exclusiveRunQueue`,
+  mirroring the lifecycle pattern used by `@qvac/llm-llamacpp`.
+- C++ `ClassificationModel` implementing the MobileNetV3-Small architecture
+  directly against `libggml` (34 conv + 2 linear layers, with depthwise
+  separable convolutions, HardSwish activations, and squeeze-and-excite
+  blocks). BatchNorm is folded into the preceding convolution at load time
+  via `foldBn()` (`eps = 0.001`); the runtime graph evaluates only the
+  resulting scale/shift, with no per-inference BN op.
+- FP16 GGUF weights (2.94 MB) bundled in `weights/` and loaded with
+  `gguf_init_from_file()` + `ggml_backend_tensor_set()`.
+- Image preprocessing pipeline: JPEG / PNG decode via `stb_image`, bilinear
+  resize to 224x224, ImageNet normalization, WHCN tensor layout.
+- Integration tests (brittle + bare) covering happy path, raw-RGB input,
+  edge cases, and lifecycle errors.
+- C++ unit tests (GoogleTest) covering graph construction, BN epsilon,
+  softmax normalization, and FP16 weight loading.
+- ONNX-to-GGUF conversion guide in `docs/onnx-to-gguf-conversion.md`.
+- `nativeLogger` constructor option (default `false`) that gates the shared
+  native C++→JS logger bridge; off by default because the underlying
+  `qvac-lib-inference-addon-cpp` `JsLogger` singleton's static `uv_async_t`
+  lifecycle is not safe across rapid create/destroy cycles. JS-level
+  logging always routes through the caller's `logger`.
+
+### Removed
+
+- `threads` constructor option. libggml's CPU thread pool now sizes itself
+  to `std::thread::hardware_concurrency` on every platform. The knob was
+  unimplementable on Android (the `ggml_backend_cpu_set_n_threads` symbol
+  lives inside the per-microarch CPU variant `.so` loaded via `dlopen`,
+  not in the addon's statically-linked `.bare`), and exposing it only on
+  desktop / iOS would have produced silently inconsistent behaviour across
+  platforms. Removed for API consistency.
+
+> **Note.** SDK plugin / schema integration (canonical model type
+> `ggml-classification` with `classification` alias) is **out of scope** for
+> 0.1.0 and will land in a follow-up PR; see the PR description for the
+> rationale.
diff --git a/packages/classification-ggml/CMakeLists.txt b/packages/classification-ggml/CMakeLists.txt
new file mode 100644
index 0000000000..0dec551734
--- /dev/null
+++ b/packages/classification-ggml/CMakeLists.txt
@@ -0,0 +1,130 @@
+cmake_minimum_required(VERSION 3.25)
+# Build switches, both OFF by default. ENABLE_COVERAGE is not read in this file (presumably by test/unit - confirm).
+option(BUILD_TESTING "Build tests" OFF)
+option(ENABLE_COVERAGE "Enable coverage instrumentation for unit tests" OFF)
+if(BUILD_TESTING)
+  list(APPEND VCPKG_MANIFEST_FEATURES "tests")  # test builds also request the "tests" manifest feature
+endif()
+# Build helper packages are looked up under node_modules/.
+find_package(cmake-bare REQUIRED PATHS node_modules/cmake-bare)
+find_package(cmake-vcpkg REQUIRED PATHS node_modules/cmake-vcpkg)
+# Prepend this package's triplet directory to any overlay triplets already set.
+set(VCPKG_OVERLAY_TRIPLETS "${CMAKE_CURRENT_SOURCE_DIR}/vcpkg/triplets;${VCPKG_OVERLAY_TRIPLETS}")
+
+# Android STL configuration must be set before project()
+if(DEFINED ENV{ANDROID_NDK} OR DEFINED ENV{ANDROID_NDK_HOME})  # keyed off the NDK environment variables
+  set(ANDROID_STL c++_shared)
+endif()
+
+project(classification-ggml LANGUAGES C CXX)
+
+if(CMAKE_SYSTEM_NAME STREQUAL "Linux")  # Linux: build against libc++ and request static linking of the C++ runtime
+  add_compile_options(-stdlib=libc++)
+  add_link_options(-stdlib=libc++ -static-libstdc++)
+endif()
+# Copy the lint configs shipped under share/lint-cpp into the package root at configure time.
+find_path(VCPKG_INSTALLED_PATH share/lint-cpp/.clang-format REQUIRED)
+foreach(_lint_cfg .clang-format .clang-tidy)
+  configure_file(${VCPKG_INSTALLED_PATH}/share/lint-cpp/${_lint_cfg}
+                 ${CMAKE_CURRENT_SOURCE_DIR}/${_lint_cfg} COPYONLY)
+endforeach()
+
+set(CMAKE_CXX_STANDARD 20)
+set(CMAKE_CXX_STANDARD_REQUIRED ON)  # fail at configure time instead of silently falling back to an older standard
+set(CMAKE_CXX_EXTENSIONS OFF)  # plain ISO C++ (-std=c++20), no GNU dialect
+set(CMAKE_POSITION_INDEPENDENT_CODE ON)
+set(CMAKE_EXPORT_COMPILE_COMMANDS ON)  # writes compile_commands.json for clang tooling
+if(WIN32)  # macros that trim what <windows.h> pulls in (and its min/max macros)
+  add_compile_definitions(WIN32_LEAN_AND_MEAN NOMINMAX NOGDI)
+endif()
+
+find_path(QVAC_LIB_INFERENCE_ADDON_CPP_INCLUDE_DIRS
+  "inference-addon-cpp/JsInterface.hpp" REQUIRED)
+find_path(STB_INCLUDE_DIRS "stb_image.h" REQUIRED)
+# Both header lookups above are REQUIRED; ggml is consumed through its CMake config package.
+find_package(ggml CONFIG REQUIRED)
+# BACKENDS_SUBDIR is "<bare_target_value>/<module_name>"; both parts come from cmake-bare helpers (exact values: TODO confirm).
+bare_target(bare_target_value)
+bare_module_target("." unused_target NAME module_name VERSION unused_version)
+set(BACKENDS_SUBDIR_VALUE "${bare_target_value}/${module_name}")
+message(STATUS "Building classification-ggml with BACKENDS_SUBDIR='${BACKENDS_SUBDIR_VALUE}'")
+
+# GGML_AVAILABLE_BACKENDS lists every backend the upstream port knows about,
+# while CMake targets exist only for the backends built into the installed
+# package (ggml-vulkan / ggml-opencl are absent on Android with our vcpkg
+# feature set). Backends without a target are skipped so that
+# add_bare_module's get_target_property() does not error out.
+set(BACKEND_DL_LIBS "")
+if(NOT APPLE AND (ANDROID OR UNIX))
+  foreach(_backend IN LISTS GGML_AVAILABLE_BACKENDS)
+    if(NOT TARGET ggml::${_backend})
+      continue()
+    endif()
+    list(APPEND BACKEND_DL_LIBS INSTALL TARGET ggml::${_backend})
+  endforeach()
+endif()
+
+add_bare_module(classification-ggml EXPORTS ${BACKEND_DL_LIBS})
+if(CMAKE_SYSTEM_NAME STREQUAL "Linux")  # keep symbols of linked static archives out of the module's exports
+  target_link_options(${classification-ggml}_module PRIVATE -Wl,--exclude-libs,ALL)
+endif()
+
+# Root of the addon's C++ sources; shared by the source list and the include
+# path below.
+set(_addon_src_root "${PROJECT_SOURCE_DIR}/addon/src")
+
+# Translation units compiled into the module.
+set(ADDON_SOURCES
+  ${_addon_src_root}/js-interface/binding.cpp
+  ${_addon_src_root}/model-interface/ClassificationModel.cpp
+  ${_addon_src_root}/model-interface/ImagePreprocessor.cpp
+  ${_addon_src_root}/model-interface/MobileNetGraph.cpp
+)
+target_sources(${classification-ggml} PRIVATE ${ADDON_SOURCES})
+
+# Include path: inference-addon-cpp headers, stb headers, then the addon's
+# own source tree.
+target_include_directories(
+  ${classification-ggml}
+  PRIVATE
+    ${QVAC_LIB_INFERENCE_ADDON_CPP_INCLUDE_DIRS}
+    ${STB_INCLUDE_DIRS}
+    ${_addon_src_root}
+)
+
+# Core ggml libraries. The CPU backend is linked conditionally further down
+# because its target is not defined on every platform.
+target_link_libraries(
+  ${classification-ggml} PRIVATE ggml::ggml ggml::ggml-base)
+
+# CPU backend. When ggml is built with GGML_CPU_ALL_VARIANTS=ON (Android via
+# qvac-fabric) there is no single ggml::ggml-cpu target: per-microarch
+# variants (ggml::ggml-cpu-android_armv8.0_1, ...armv8.2_1, ...armv8.2_2,
+# ...armv8.6_1) are loaded as MODULE .so files at runtime via dlopen. With
+# variants off (Apple/Linux/Windows desktop) ggml::ggml-cpu exists as a
+# single static target and is linked here.
+if(TARGET ggml::ggml-cpu)
+  target_link_libraries(${classification-ggml} PRIVATE ggml::ggml-cpu)
+endif()
+
+# BACKENDS_SUBDIR carries the quoted "<bare target>/<module name>" string
+# computed earlier in this file; JS_LOGGER is defined without a value.
+target_compile_definitions(
+  ${classification-ggml}
+  PRIVATE
+    BACKENDS_SUBDIR="${BACKENDS_SUBDIR_VALUE}"
+    JS_LOGGER
+)
+
+# Windows only: msvcrt.lib is added to the link line explicitly, next to the
+# ggml libraries linked above.
+if(WIN32)
+  target_link_libraries(${classification-ggml} PRIVATE msvcrt.lib)
+endif()
+
+if(BUILD_TESTING)  # unit tests are opt-in; the option defaults to OFF
+  find_package(GTest CONFIG REQUIRED)
+  include(GoogleTest)  # CMake's GoogleTest helper module
+  enable_testing()  # turns on CTest for this directory and the subdirectory added next
+  add_subdirectory(test/unit)
+endif()
diff --git a/packages/classification-ggml/LICENSE b/packages/classification-ggml/LICENSE
new file mode 100644
index 0000000000..7d199ae333
--- /dev/null
+++ b/packages/classification-ggml/LICENSE
@@ -0,0 +1,179 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+Copyright 2026 Tether Data, S.A. de C.V.
diff --git a/packages/classification-ggml/NOTICE b/packages/classification-ggml/NOTICE
new file mode 100644
index 0000000000..0bb0b704b5
--- /dev/null
+++ b/packages/classification-ggml/NOTICE
@@ -0,0 +1,42 @@
+@qvac/classification-ggml
+Copyright 2026 Tether Operations Limited
+
+This product includes software developed by Tether Operations Limited
+(https://tether.io/).
+
+Licensed under the Apache License, Version 2.0 (the "License"); you may
+not use this file except in compliance with the License. You may obtain
+a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+
+================================================================================
+
+This product bundles the following third-party components:
+
+--------------------------------------------------------------------------------
+ggml — a tensor library for machine learning
+Copyright (c) 2022-2025 Georgi Gerganov
+Licensed under the MIT License.
+Source: https://github.com/ggerganov/ggml
+
+--------------------------------------------------------------------------------
+stb_image.h / stb_image_resize2.h — Sean Barrett's public-domain image library
+Licensed under the MIT License / Public Domain (dual).
+Source: https://github.com/nothings/stb
+
+--------------------------------------------------------------------------------
+MobileNetV3-Small (Howard et al., 2019) — reference architecture
+Weights shipped in this package are a 3-class fine-tune of the PyTorch /
+torchvision reference model. Original torchvision model and code are
+Copyright (c) Meta Platforms / PyTorch Contributors, BSD-3-Clause licensed.
+Paper: "Searching for MobileNetV3" (arXiv:1905.02244).
+
+The fine-tuned weight file (weights/mobilenetv3_3class_v3_fp16.gguf) is
+released under the Apache-2.0 license, same as this package.
diff --git a/packages/classification-ggml/README.md b/packages/classification-ggml/README.md
new file mode 100644
index 0000000000..60e7fd5ee1
--- /dev/null
+++ b/packages/classification-ggml/README.md
@@ -0,0 +1,229 @@
+# @qvac/classification-ggml
+
+GGML-powered image classification addon for QVAC. Runs a fine-tuned MobileNetV3-Small 3-class triage CNN on the CPU backend of `libggml` and exposes a small, stable JavaScript API. The bundled model targets one specific image-triage task, but the addon can easily be adapted to other classification tasks.
+
+
+| Property      | Value                                           |
+| ------------- | ----------------------------------------------- |
+| Model         | MobileNetV3-Small (3 classes)                   |
+| Parameters    | ~2.5 M                                          |
+| Weights       | FP16 GGUF, **2.94 MB**, bundled in this package |
+| Input         | JPEG, PNG, or raw RGB bytes                     |
+| Resize target | 224 × 224 (bilinear)                            |
+| Normalization | ImageNet mean/std                               |
+| Backend       | `libggml` CPU (no GPU dependency)               |
+
+
+Package name: `@qvac/classification-ggml`  
+Directory: `packages/classification-ggml`
+
+## Install
+
+This addon is published to the `@qvac` scope and consumed like any other QVAC native addon. When used from the monorepo, `npm install` resolves `@qvac/infer-base` and `@qvac/logging` via the workspace.
+
+## Quickstart
+
+```js
+const ImageClassifier = require('@qvac/classification-ggml')
+
+const classifier = new ImageClassifier()
+await classifier.load()
+
+const imageBuffer = fs.readFileSync('./my-image.jpg')
+const result = await classifier.classify(imageBuffer)
+// [ { label: 'food',   confidence: 0.93 },
+//   { label: 'other',  confidence: 0.05 },
+//   { label: 'report', confidence: 0.02 } ]
+
+await classifier.unload()
+```
+
+### Raw RGB input
+
+```js
+const result = await classifier.classify(rgbBuffer, {
+  width: 320,
+  height: 240,
+  channels: 3,
+})
+```
+
+### topK filter
+
+By default `classify()` returns one entry per class, sorted from most likely to least likely. Pass `topK: N` to keep only the top `N` results — for example `topK: 1` returns just the single highest-scoring class:
+
+```js
+const best = await classifier.classify(buf, { topK: 1 })
+```
+
+## API
+
+
+| Method                             | Description                                                             |
+| ---------------------------------- | ----------------------------------------------------------------------- |
+| `new ImageClassifier(opts?)`       | `opts = { modelPath?, logger?, nativeLogger? }`                         |
+| `await load()`                     | Initialises the GGML backend and loads weights. Idempotent.             |
+| `await classify(buffer, options?)` | Runs inference. Returns `[{ label, confidence }, …]` sorted descending. |
+| `await unload()`                   | Releases native resources. Safe to call again.                          |
+| `await destroy()`                  | Releases resources and marks the instance as destroyed.                 |
+| `getState()`                       | Returns `{ configLoaded, destroyed }`.                                  |
+
+
+See `index.d.ts` for the full TypeScript surface.
+
+### Parameters
+
+#### `new ImageClassifier(opts?)`
+
+All constructor options are optional.
+
+
+| Option         | Type                | Default                                               | Description                                                                                                                                                                                                                                                                                                                            |
+| -------------- | ------------------- | ----------------------------------------------------- | -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `modelPath`    | `string`            | Bundled `weights/mobilenetv3_3class_v3_fp16.gguf`     | Absolute path to an FP16 GGUF file. Override only when pointing at a custom fine-tune produced by the ONNX→GGUF conversion guide. Also overridable via the `QVAC_CLASSIFICATION_MODEL_PATH` env variable.                                                                                                                              |
+| `logger`       | `QvacLogger`-shaped | `null`                                                | A sink with optional `error / warn / info / debug(msg)` methods (compatible with `@qvac/logging`). Receives JS-side `info` from a successful `load()` and `error` from a failed `load()`. With `nativeLogger: true`, also receives forwarded native `LogMsg` events at `info` level. Always honoured, regardless of `nativeLogger`.    |
+| `nativeLogger` | `boolean`           | `false`                                               | When `true`, native C++ `QLOG(...)` lines from inside the addon's model-loading and graph code are forwarded to `logger`. Disabled by default because the underlying `qvac-lib-inference-addon-cpp` logger is a process-wide singleton with a static `uv_async_t` that is not safe across rapid create/destroy cycles (e.g. in tests). |
+
+
+#### `await classify(imageInput, options?)`
+
+
+| Parameter                 | Type     | Default                   | Description                                                                                                                                                     |
+| ------------------------- | -------- | ------------------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------- |
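+| `imageInput` *(required)* | `Buffer \| Uint8Array` | —          | Image bytes: an encoded JPEG or PNG, or raw RGB pixels when `width`, `height` and `channels` are supplied.                                                      |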
+| `options.topK`            | `number` | `undefined` (all classes) | If set, the returned array is truncated to this many entries (top-K highest confidences). Must be a positive integer. Passing a value ≥ class count is a no-op. |
+| `options.width`           | `number` | —                         | **Required** for raw RGB input. Integer > 0. The underlying buffer must be exactly `width × height × channels` bytes; any mismatch throws a structured error.   |
+| `options.height`          | `number` | —                         | **Required** for raw RGB input. Integer > 0.                                                                                                                    |
+| `options.channels`        | `3`      | —                         | **Required** for raw RGB input. Must be exactly `3`. Grayscale and RGBA are not supported — decode or drop the alpha channel on the caller side.                |
+
+
+Returns `Promise<ClassificationResult[]>` where each entry is `{ label: string; confidence: number }`. The array is sorted by `confidence` descending, confidences are softmax probabilities in `[0, 1]` summing to ≈ 1, and `label` comes from the loaded GGUF's `mobilenet.class_N` metadata (so a future fine-tune can introduce new label strings without a code change).
+
+#### `await load()` / `await unload()` / `await destroy()`
+
+None take arguments. `load()` is idempotent — calling it twice is a no-op (check `getState().configLoaded` if you want to verify). `unload()` safely tears down the native handle and may be called multiple times. `destroy()` is equivalent to `unload()` plus a sticky `destroyed` flag in `getState()` — useful if your code wants to refuse reuse of a released instance.
+
+## Output contract
+
+- An array of `{ label: string, confidence: number }`.
+- Sorted by `confidence` descending.
+- `confidence` values are softmax probabilities in `[0, 1]` and sum to ≈ 1.
+- Labels come from the GGUF metadata (`mobilenet.class_0/1/2`). For the bundled weights these are `food`, `report`, `other`.
+
+## Build (from source, monorepo)
+
+Prerequisites: clang (LLVM ≥ 19) with matching `libc++-dev`, vcpkg, bare ≥ 1.24, bare-make. CI pins the exact LLVM major via the shared `setup-llvm` action; locally any recent clang works.
+
+```bash
+cd packages/classification-ggml
+npm install
+bare-make generate
+bare-make build
+bare-make install
+```
+
+One-liner: `npm install && bare-make generate && bare-make build && bare-make install`.
+
+## Testing
+
+```bash
+npm run test:integration     # brittle + bare JS integration tests (desktop)
+npm run test:cpp             # GoogleTest C++ unit tests
+npm run test:mobile:generate # regenerate test/mobile/integration.auto.cjs
+npm run test:mobile:validate # verify mobile test file structure
+```
+
+Integration tests live in `test/integration/*.test.js` and use the 6 sample images under `test/images/` (two images per class).
+
+### Mobile tests
+
+Mobile tests use the shared `qvac-test-addon-mobile` framework. The `test/mobile/integration.auto.cjs` file is auto-generated by `scripts/generate-mobile-integration-tests.js` from every `*.test.js` under `test/integration/`, so adding a new integration test automatically exposes it on mobile too.
+
+Before the mobile harness can be built, run
+
+```bash
+npm run mobile:copy-prebuilds
+```
+
+to populate `test/mobile/testAssets/` (driven by `scripts/copy-mobile-test-assets.js`). The script (a) fans out the single arm64 prebuild into the per-flavour directories the framework expects under `prebuilds/`, (b) copies the FP16 GGUF weights with a `.gguf.bin` suffix so the React Native bundler treats them as a binary asset, and (c) copies every `test/images/*.{jpg,jpeg,png}` into `testAssets/` so the integration tests can resolve them via `global.assetPaths` on-device. None of these copied files are checked into git. See [test/mobile/README.md](test/mobile/README.md) for the lifecycle note about the shared native logger.
+
+## Platform support
+
+
+| Platform            | CPU | Notes            |
+| ------------------- | --- | ---------------- |
+| Linux x64           | ✅   |                  |
+| Linux arm64         | ✅   |                  |
+| macOS arm64 (Apple) | ✅   |                  |
+| macOS x64 (Intel)   | ✅   |                  |
+| Windows x64         | ✅   |                  |
+| Android arm64       | ✅   | `c++_shared` STL |
+| iOS arm64           | ✅   |                  |
+
+
+All platforms are produced by the shared `reusable-prebuilds.yml`
+matrix and merged into a single `prebuilds` artifact for downstream
+consumption. GPU (Vulkan / Metal / CUDA) is not currently supported.
+
+## Performance
+
+Depending on the platform, one call to `classifier.classify(buffer)` takes from a few tens to a couple of hundred milliseconds.
+
+### What affects `classify()` latency
+
+- **CPU thread pool** — libggml sizes its internal CPU worker pool to `std::thread::hardware_concurrency` on every platform. The addon does not expose a tuning knob for this; if a future need arises, raise an issue and we can add one.
+- **Input size** — the JPEG/PNG decode and the `stb_image_resize2` bilinear pass scale with source pixel count. The 224×224 tensor pass is fixed-cost; a 12 MP phone photo adds real overhead vs. a 640×480 webcam frame.
+- **First-call overhead** — `load()` already runs a full-pipeline warmup (synthetic-pattern pass through preprocess + GGML compute + output read) before returning, so the GGML compute buffers, weight buffer, and worker thread are fully materialised when the first `classify()` is dispatched. Even so, the first user-supplied call is typically a few tens of milliseconds slower than the steady-state average.
+- **Re-use** — `load()` once, `classify()` many times. Tearing down and rebuilding the model for each image is roughly 4–6× slower end-to-end and is never necessary outside of tests.
+
+### Memory footprint
+
+
+| Component                                                  | Size            |
+| ---------------------------------------------------------- | --------------- |
+| Bundled FP16 weights (mmapped)                             | 2.94 MB         |
+| Backend weight buffer (FP16 + folded BN + FP32 classifier) | ≈ 5.5 MB        |
+| Intermediate activations (compute buffer)                  | single-digit MB |
+| **Total resident** during inference                        | **~8–10 MB**    |
+
+
+All GGML compute buffers (input tensor, intermediate activations, output) are allocated **once** at `load()` time and reused on every `classify()` call — `ggml_backend_tensor_set` / `_get` are the only operations that touch them per request. Per-call C++ allocations are bounded: one input-buffer copy across the bare-runtime boundary, the decoded RGB buffer, the resized 224×224 RGB buffer, the WHCN F32 tensor, and the 3-element softmax + result vectors. Multiple `ImageClassifier` instances each keep their own compute buffer and worker thread — you pay the ~8 MB once per instance.
+
+### Why FP16 weights?
+
+FP16 was chosen because it matches FP32 top-1 accuracy on the internal validation set while halving the on-disk footprint (≈3 MB vs ≈6 MB) and giving a measurable inference speed-up on every CPU backend we ship. More aggressive quantizations (Q8_0, Q4_K and below) were evaluated on the same validation set and showed noticeable accuracy degradation, which for a 3-class triage model is not acceptable. If you fine-tune your own MobileNetV3-Small, keep FP16 as the publish format unless you re-run the full validation suite at the lower precision.
+
+### Measuring locally
+
+The integration suite hooks the shared `scripts/test-utils/performance-reporter.js` via `test/integration/utils.js`. Running
+
+```bash
+npm run test:integration
+```
+
+writes `test/results/performance-report.json` with one `total_time_ms` entry per sample image, and in GitHub Actions also emits a Markdown step summary.
+
+## Architecture
+
+See [docs/architecture.md](docs/architecture.md) for the MobileNetV3-Small layer breakdown and graph construction notes, and [docs/data-flow.md](docs/data-flow.md) for the end-to-end request flow.
+
+### Why a custom GGML graph?
+
+`llama.cpp` doesn't support CNN architectures, so this addon bypasses it entirely and talks directly to the stable `ggml_*` / `ggml_backend_*` public API.
+
+For this MobileNetV3-Small the GGML CPU backend is, in most configurations, slower per call than the same network running on a mature PyTorch or ONNX Runtime build with their hand-tuned convolution kernels. Because the model is very small (≈2.5 M params, single-digit-millisecond compute on a modern phone), the absolute gap is negligible for a triage workload and is dominated by image decode and JS↔native marshalling. If a substantially larger classifier is ever added on top of this same scaffolding, expect to invest extra effort in graph-level optimisations (operator fusion, matmul tiling, FP16 SIMD kernels, threadpool sizing) before the GGML path is competitive.
+
+## Converting a new model
+
+If you fine-tune or swap the underlying MobileNetV3 model, follow [docs/onnx-to-gguf-conversion.md](docs/onnx-to-gguf-conversion.md). The graph construction is parameterised by `kBlocks` in `MobileNetGraph.hpp` — only classes and weights change between fine-tunes.
+
+## Troubleshooting
+
+- **“MobileNet GGUF weights not found”**: the default path is `<package>/weights/mobilenetv3_3class_v3_fp16.gguf`. Override with `new ImageClassifier({ modelPath: '/abs/path.gguf' })` or set the `QVAC_CLASSIFICATION_MODEL_PATH` env variable.
+- **All predictions look wrong**: verify the BN epsilon is still `0.001` (see the guarded unit test) — the architecture is unusually sensitive to this constant.
+- **Build fails looking for `stb_image.h`**: make sure the `stb` vcpkg port is installed. The `vcpkg-configuration.json` pins it.
+- **Mobile build fails looking for `libggml-cpu`**: the prebuild workflow copies all `ggml::${_backend}` targets into `prebuilds/`. Re-run `bare-make install`.
+
+## License
+
+Apache-2.0. See [LICENSE](LICENSE) and [NOTICE](NOTICE).
\ No newline at end of file
diff --git a/packages/classification-ggml/addon.js b/packages/classification-ggml/addon.js
new file mode 100644
index 0000000000..98dd91e160
--- /dev/null
+++ b/packages/classification-ggml/addon.js
@@ -0,0 +1,109 @@
+'use strict'
+
+// Native JsLogger is a process-wide singleton (static uv_async_t in
+// addon-cpp); install its JS callback once, switch sinks per instance.
+let _loggerInstalled = false
+let _activeLoggerSink = null
+
+function _ensureLoggerInstalled (binding) {
+  if (_loggerInstalled) return
+  const levels = ['error', 'warn', 'info', 'debug']
+  binding.setLogger((priority, message) => {
+    const sink = _activeLoggerSink
+    if (!sink) return
+    const level = levels[priority] || 'info'
+    if (typeof sink[level] === 'function') {
+      try { sink[level](message) } catch (_) {}
+    }
+  })
+  _loggerInstalled = true
+}
+
+function _setActiveLoggerSink (sink) { _activeLoggerSink = sink }
+function _clearActiveLoggerSink (sink) {
+  if (_activeLoggerSink === sink) _activeLoggerSink = null
+}
+
+/**
+ * Normalize a raw native event to `Output` / `Error` / `LogMsg` /
+ * `JobEnded`, or `null` to drop. Keyed on payload shape because the
+ * upstream JobRunner emits the stats trailer with a raw RTTI event
+ * name (no `JobEnded` substring), so an array → `Output` and a plain
+ * object → terminal `JobEnded`.
+ */
+function mapAddonEvent (rawEvent, rawData, rawError) {
+  if (typeof rawEvent === 'string') {
+    if (rawEvent.includes('Error')) {
+      return { type: 'Error', data: rawData, error: rawError }
+    }
+    if (rawEvent.includes('LogMsg')) {
+      return { type: 'LogMsg', data: rawData, error: null }
+    }
+    if (rawEvent.includes('JobEnded')) {
+      return { type: 'JobEnded', data: rawData, error: null }
+    }
+    if (rawEvent.includes('JobStarted')) {
+      return null
+    }
+  }
+  if (Array.isArray(rawData)) {
+    return { type: 'Output', data: rawData, error: null }
+  }
+  if (rawData && typeof rawData === 'object') {
+    return { type: 'JobEnded', data: rawData, error: null }
+  }
+  return { type: rawEvent, data: rawData, error: rawError }
+}
+
+/**
+ * Thin JS↔native bridge owning one bare C++ instance handle. Lifecycle
+ * lives in `index.js`, mirroring `LlamaInterface` / `LlmLlamacpp`.
+ *
+ * `opts.disableNativeLogger` controls whether the native LogMsg bridge is
+ * armed for this instance; kept on a sibling arg so `configurationParams`
+ * stays 1:1 with the C++ schema (no JS-only `__`-prefixed flags).
+ */
+class ClassificationInterface {
+  constructor (binding, configurationParams, outputCb, logger = null, opts = {}) {
+    this._binding = binding
+    this._handle = null
+    this._logger = logger
+
+    if (logger && typeof logger === 'object' && !opts.disableNativeLogger) {
+      _ensureLoggerInstalled(binding)
+      _setActiveLoggerSink(logger)
+    }
+
+    this._handle = this._binding.createInstance(this, configurationParams, outputCb)
+  }
+
+  async activate () {
+    if (!this._handle) throw new Error('Classification addon is not initialized')
+    this._binding.activate(this._handle)
+  }
+
+  async runJob (input) {
+    if (!this._handle) throw new Error('Classification addon is not initialized')
+    return this._binding.runJob(this._handle, input)
+  }
+
+  async cancel () {
+    if (!this._handle) return
+    await this._binding.cancel(this._handle)
+  }
+
+  async unload () {
+    if (this._handle === null) return
+    if (this._logger) _clearActiveLoggerSink(this._logger)
+    try {
+      this._binding.destroyInstance(this._handle)
+    } finally {
+      this._handle = null
+    }
+  }
+}
+
+module.exports = {
+  ClassificationInterface,
+  mapAddonEvent
+}
diff --git a/packages/classification-ggml/addon/src/addon/AddonJs.hpp b/packages/classification-ggml/addon/src/addon/AddonJs.hpp
new file mode 100644
index 0000000000..753d469221
--- /dev/null
+++ b/packages/classification-ggml/addon/src/addon/AddonJs.hpp
@@ -0,0 +1,213 @@
+#pragma once
+
+#include <cstdio>
+#include <cstdlib>
+#include <memory>
+#include <string>
+#include <utility>
+#include <vector>
+
+#include <js.h>
+#include <inference-addon-cpp/Errors.hpp>
+#include <inference-addon-cpp/JsInterface.hpp>
+#include <inference-addon-cpp/JsUtils.hpp>
+#include <inference-addon-cpp/ModelInterfaces.hpp>
+#include <inference-addon-cpp/addon/AddonJs.hpp>
+#include <inference-addon-cpp/handlers/JsOutputHandlerImplementations.hpp>
+#include <inference-addon-cpp/handlers/OutputHandler.hpp>
+#include <inference-addon-cpp/queue/OutputCallbackJs.hpp>
+#include <inference-addon-cpp/queue/OutputQueue.hpp>
+
+#include "model-interface/ClassificationModel.hpp"
+
+namespace classification_ggml::bindings {
+
+namespace addon_cpp = qvac_lib_inference_addon_cpp;
+namespace jsu = qvac_lib_inference_addon_cpp::js;
+
+using qvac_errors::StatusError;
+using qvac_errors::general_error::InvalidArgument;
+
+/// Marshals a `ClassifyOutput` into a JS array of `{ label, confidence }`
+/// objects, keeping the order of `results`. With
+/// `QVAC_CLASSIFICATION_TRACE=1` each marshalled entry is also dumped to
+/// stderr.
+struct JsClassifyOutputHandler
+    : addon_cpp::out_handl::JsBaseOutputHandler<ClassifyOutput> {
+  JsClassifyOutputHandler()
+      : JsBaseOutputHandler<ClassifyOutput>(
+            [this](const ClassifyOutput& cppOut) -> js_value_t* {
+              auto jsResults = jsu::Array::create(this->env_);
+
+              // The environment variable is read on every invocation.
+              const char* traceFlag =
+                  std::getenv("QVAC_CLASSIFICATION_TRACE");
+              const bool traceOn =
+                  traceFlag != nullptr && traceFlag[0] == '1';
+
+              size_t index = 0;
+              for (const auto& result : cppOut.results) {
+                // JS numbers are doubles; widen once and reuse.
+                const double confidence =
+                    static_cast<double>(result.confidence);
+
+                if (traceOn) {
+                  std::fprintf(
+                      stderr,
+                      "[qvac-classify-marshal] i=%zu label='%s' "
+                      "confidence=%.9f\n",
+                      index,
+                      result.label.c_str(),
+                      confidence);
+                  std::fflush(stderr);
+                }
+
+                auto jsEntry = jsu::Object::create(this->env_);
+                jsEntry.setProperty(
+                    this->env_,
+                    "label",
+                    jsu::String::create(this->env_, result.label));
+                jsEntry.setProperty(
+                    this->env_,
+                    "confidence",
+                    jsu::Number::create(this->env_, confidence));
+                jsResults.set(this->env_, index, jsEntry);
+                ++index;
+              }
+              return jsResults;
+            }) {}
+};
+
+/// JS entry point `createInstance(jsHandle, config, outputCallback)`.
+///
+/// Reads the required `config.path`, optionally applies
+/// `config.config.backendsDir`, loads the model, and only then wires the
+/// output callback and wraps everything in an `AddonJs`.
+inline js_value_t* createInstance(
+    js_env_t* env, js_callback_info_t* info) try {
+  addon_cpp::JsArgsParser args(env, info);
+
+  auto config = args.getJsObject(1, "config");
+  const auto weightsPath =
+      config.getProperty<jsu::String>(env, "path").as<std::string>(env);
+  if (weightsPath.empty()) {
+    throw StatusError(
+        InvalidArgument,
+        "Configuration 'path' is required and must be a non-empty string "
+        "pointing at the FP16 GGUF weights file");
+  }
+
+  auto classifier = std::make_unique<ClassificationModel>(weightsPath);
+
+  // `config.config.backendsDir` is optional at both nesting levels.
+  if (auto nested = config.getOptionalProperty<jsu::Object>(env, "config");
+      nested.has_value()) {
+    if (auto dir =
+            nested->getOptionalProperty<jsu::String>(env, "backendsDir");
+        dir.has_value()) {
+      classifier->setBackendsDir(dir->as<std::string>(env));
+    }
+  }
+
+  // Load before building the addon so load failures surface from this call.
+  classifier->load();
+
+  addon_cpp::out_handl::OutputHandlers<
+      addon_cpp::out_handl::JsOutputHandlerInterface>
+      handlers;
+  handlers.add(std::make_shared<JsClassifyOutputHandler>());
+
+  auto jsCallback = std::make_unique<addon_cpp::OutputCallBackJs>(
+      env,
+      args.get(0, "jsHandle"),
+      args.getFunction(2, "outputCallback"),
+      std::move(handlers));
+
+  auto wrapped = std::make_unique<addon_cpp::AddonJs>(
+      env,
+      std::move(jsCallback),
+      std::unique_ptr<addon_cpp::model::IModel>(std::move(classifier)));
+
+  return addon_cpp::JsInterface::createInstance(env, std::move(wrapped));
+}
+JSCATCH
+
+/// JS entry point `runJob(instance, inputObj)`: validates `inputObj`, copies
+/// the image bytes into a `ClassifyInput`, and hands it to the addon instance.
+///
+/// Fields read from `inputObj`, in validation order:
+///  - `type`: must be the string "image".
+///  - `content`: a non-empty Uint8Array holding the image bytes.
+///  - `width` / `height` / `channels`: optional, all-or-nothing. When present,
+///    width and height must be > 0 and channels must be exactly 3.
+///  - `topK`: optional; must be > 0 when present.
+///
+/// Every validation failure throws `StatusError(InvalidArgument, ...)`. The
+/// trailing `JSCATCH` presumably turns C++ exceptions into JS errors — confirm
+/// against inference-addon-cpp.
+inline js_value_t* runJob(js_env_t* env, js_callback_info_t* info) try {
+  addon_cpp::JsArgsParser args(env, info);
+  addon_cpp::AddonJs& instance =
+      addon_cpp::JsInterface::getInstance(env, args.get(0, "instance"));
+
+  auto inputObj = args.getJsObject(1, "inputObj");
+  auto type =
+      inputObj.getProperty<jsu::String>(env, "type").as<std::string>(env);
+  if (type != "image") {
+    throw StatusError(
+        InvalidArgument,
+        "Classification addon accepts only 'image' input type, got '" + type +
+            "'");
+  }
+
+  ClassifyInput cppInput;
+
+  // Error wording is a test contract: integration suite asserts on the
+  // substrings "required" / "null" / "undefined" for the null-input case.
+  auto bufferVal = inputObj.getProperty(env, "content");
+  if (!jsu::is<jsu::TypedArray<uint8_t>>(env, bufferVal)) {
+    throw StatusError(
+        InvalidArgument,
+        "Image 'content' is required and must be a Uint8Array / Buffer of "
+        "encoded JPEG/PNG bytes or raw RGB bytes (got null, undefined, or "
+        "wrong type)");
+  }
+  auto ta = jsu::TypedArray<uint8_t>(env, bufferVal);
+  auto span = ta.as<std::span<const uint8_t>>(env);
+  if (span.empty()) {
+    throw StatusError(InvalidArgument, "Image 'content' buffer is empty");
+  }
+  // Copy the bytes into the job input so it owns its own buffer.
+  cppInput.data.assign(span.begin(), span.end());
+
+  // {width, height, channels} are an all-or-nothing trio: zero present
+  // means encoded JPEG/PNG, three present means raw RGB.
+  auto widthOpt = inputObj.getOptionalProperty<jsu::Number>(env, "width");
+  auto heightOpt = inputObj.getOptionalProperty<jsu::Number>(env, "height");
+  auto channelsOpt =
+      inputObj.getOptionalProperty<jsu::Number>(env, "channels");
+  const int provided = (widthOpt.has_value() ? 1 : 0) +
+                       (heightOpt.has_value() ? 1 : 0) +
+                       (channelsOpt.has_value() ? 1 : 0);
+  if (provided != 0 && provided != 3) {
+    throw StatusError(
+        InvalidArgument,
+        "Raw RGB input requires all of 'width', 'height', and 'channels' "
+        "to be provided together; received " + std::to_string(provided) +
+        " of 3");
+  }
+  if (provided == 3) {
+    // bare-runtime's `as<uint32_t>` static_casts negatives to ~4 billion;
+    // pull the int32_t view first to range-check meaningfully.
+    const int32_t w = widthOpt->as<int32_t>(env);
+    const int32_t h = heightOpt->as<int32_t>(env);
+    const int32_t c = channelsOpt->as<int32_t>(env);
+    if (w <= 0) {
+      throw StatusError(
+          InvalidArgument,
+          "Image 'width' must be a positive integer when passing raw RGB "
+          "bytes; got " + std::to_string(w));
+    }
+    if (h <= 0) {
+      throw StatusError(
+          InvalidArgument,
+          "Image 'height' must be a positive integer when passing raw RGB "
+          "bytes; got " + std::to_string(h));
+    }
+    if (c != 3) {
+      throw StatusError(
+          InvalidArgument,
+          "Image 'channels' must be exactly 3 (RGB) when passing raw RGB "
+          "bytes; got " + std::to_string(c));
+    }
+    // All three values are known positive here, so the casts cannot wrap.
+    cppInput.rawRgb = RawRgbDims{
+        static_cast<uint32_t>(w), static_cast<uint32_t>(h),
+        static_cast<uint32_t>(c)};
+  }
+
+  // NOTE(review): the buffer length is not compared against
+  // width * height * channels here — presumably the preprocessor checks it;
+  // confirm.
+  auto topKOpt = inputObj.getOptionalProperty<jsu::Number>(env, "topK");
+  if (topKOpt.has_value()) {
+    const int32_t topK = topKOpt->as<int32_t>(env);
+    if (topK <= 0) {
+      throw StatusError(
+          InvalidArgument,
+          "Image 'topK' must be a positive integer when provided; got " +
+              std::to_string(topK));
+    }
+    cppInput.topK = static_cast<uint32_t>(topK);
+  }
+
+  return instance.runJob(std::any(std::move(cppInput)));
+}
+JSCATCH
+
+} // namespace classification_ggml::bindings
diff --git a/packages/classification-ggml/addon/src/js-interface/binding.cpp b/packages/classification-ggml/addon/src/js-interface/binding.cpp
new file mode 100644
index 0000000000..875f816043
--- /dev/null
+++ b/packages/classification-ggml/addon/src/js-interface/binding.cpp
@@ -0,0 +1,38 @@
+#include <bare.h>
+
+#include "addon/AddonJs.hpp"
+
+js_value_t* classification_ggml_exports(
+    js_env_t* env,
+    js_value_t* exports) { // NOLINT(readability-identifier-naming)
+
+// Registers one native callback on `exports` under `jsName`. If either the
+// function creation or the property assignment fails, the enclosing function
+// returns nullptr immediately.
+// NOLINTBEGIN(cppcoreguidelines-macro-usage)
+#define EXPORT_FN(jsName, nativeFn)                                            \
+  do {                                                                         \
+    js_value_t* fnValue = nullptr;                                             \
+    if (js_create_function(env, jsName, -1, nativeFn, nullptr, &fnValue) !=    \
+            0 ||                                                               \
+        js_set_named_property(env, exports, jsName, fnValue) != 0) {           \
+      return nullptr;                                                          \
+    }                                                                          \
+  } while (false)
+
+  // Entry points implemented by this addon.
+  EXPORT_FN("createInstance", classification_ggml::bindings::createInstance);
+  EXPORT_FN("runJob", classification_ggml::bindings::runJob);
+
+  // Entry points provided by the shared inference-addon-cpp JsInterface.
+  EXPORT_FN(
+      "loadWeights", qvac_lib_inference_addon_cpp::JsInterface::loadWeights);
+  EXPORT_FN("activate", qvac_lib_inference_addon_cpp::JsInterface::activate);
+  EXPORT_FN("cancel", qvac_lib_inference_addon_cpp::JsInterface::cancel);
+  EXPORT_FN(
+      "destroyInstance",
+      qvac_lib_inference_addon_cpp::JsInterface::destroyInstance);
+  EXPORT_FN("setLogger", qvac_lib_inference_addon_cpp::JsInterface::setLogger);
+  EXPORT_FN(
+      "releaseLogger",
+      qvac_lib_inference_addon_cpp::JsInterface::releaseLogger);
+
+#undef EXPORT_FN
+  // NOLINTEND(cppcoreguidelines-macro-usage)
+
+  return exports;
+}
+
+BARE_MODULE(classification_ggml, classification_ggml_exports)
diff --git a/packages/classification-ggml/addon/src/model-interface/ClassificationModel.cpp b/packages/classification-ggml/addon/src/model-interface/ClassificationModel.cpp
new file mode 100644
index 0000000000..72677e3d75
--- /dev/null
+++ b/packages/classification-ggml/addon/src/model-interface/ClassificationModel.cpp
@@ -0,0 +1,325 @@
+#include "ClassificationModel.hpp"
+
+#include <algorithm>
+#include <chrono>
+#include <cmath>
+#include <cstdint>
+#include <cstdio>
+#include <cstdlib>
+#include <limits>
+#include <numeric>
+#include <span>
+#include <stdexcept>
+#include <string>
+#include <vector>
+
+#if defined(__ANDROID__)
+#include <filesystem>
+#endif
+
+#include <ggml-alloc.h>
+#include <ggml-backend.h>
+#include <ggml-cpu.h>
+#include <ggml.h>
+#include <gguf.h>
+#include <inference-addon-cpp/Errors.hpp>
+#include <inference-addon-cpp/Logger.hpp>
+
+#include "ImagePreprocessor.hpp"
+#include "MobileNetGraph.hpp"
+
+namespace classification_ggml {
+
+using qvac_errors::StatusError;
+using qvac_errors::general_error::InternalError;
+using qvac_errors::general_error::InvalidArgument;
+
+namespace {
+constexpr const char* kModelName = "mobilenetv3-small-ggml-classification";
+} // namespace
+
+/// Stores the weights path only; the backend, weights and graph are set up
+/// later by load().
+ClassificationModel::ClassificationModel(std::string modelPath)
+    : modelPath_(std::move(modelPath)) {}
+
+ClassificationModel::~ClassificationModel() {
+  // Teardown order matters: ggml buffers have to be released strictly before
+  // the backend they were allocated on, so drop both buffer holders first.
+  compute_.reset();
+  weights_.reset();
+
+  if (backend_ == nullptr) {
+    return;
+  }
+  ggml_backend_free(backend_);
+  backend_ = nullptr;
+}
+
+/// Returns the fixed model identifier.
+std::string ClassificationModel::getName() const {
+  return std::string(kModelName);
+}
+
+/// Reports the duration of the most recent successful process() call as a
+/// single `total_time_ms` entry.
+qvac_lib_inference_addon_cpp::RuntimeStats
+ClassificationModel::runtimeStats() const {
+  constexpr double kMicrosPerMilli = 1000.0;
+
+  qvac_lib_inference_addon_cpp::RuntimeStats report;
+  report.emplace_back(
+      "total_time_ms",
+      static_cast<double>(lastInferenceUs_) / kMicrosPerMilli);
+  return report;
+}
+
+/// Records the prebuilds root that load() reads on Android.
+void ClassificationModel::setBackendsDir(std::string backendsDir) {
+  // Takes the same mutex as load() and process().
+  const std::scoped_lock guard(mutex_);
+  backendsDir_ = std::move(backendsDir);
+}
+
+namespace {
+
+/// Max-shifted (numerically stable) softmax over `logits`.
+///
+/// Non-finite logits contribute zero mass. If no logit is finite, or the
+/// exponential sum is not a positive finite number, the result is the uniform
+/// distribution, so callers always receive probabilities that sum to 1. An
+/// empty input yields an empty vector.
+std::vector<float> softmax(std::span<const float> logits) {
+  const size_t count = logits.size();
+  if (count == 0) {
+    return {};
+  }
+
+  const auto uniformFallback = [count]() {
+    return std::vector<float>(count, 1.0F / static_cast<float>(count));
+  };
+
+  // Manual scan instead of std::max_element, whose result is unspecified
+  // when the range contains NaN.
+  float peak = -std::numeric_limits<float>::infinity();
+  for (size_t i = 0; i < count; ++i) {
+    const float value = logits[i];
+    if (std::isfinite(value) && value > peak) {
+      peak = value;
+    }
+  }
+  if (!std::isfinite(peak)) {
+    return uniformFallback();
+  }
+
+  std::vector<float> probs(count);
+  float total = 0.0F;
+  for (size_t i = 0; i < count; ++i) {
+    const float shifted = logits[i] - peak;
+    probs[i] = std::isfinite(shifted) ? std::exp(shifted) : 0.0F;
+    total += probs[i];
+  }
+
+  if (!std::isfinite(total) || total <= 0.0F) {
+    return uniformFallback();
+  }
+
+  const float scale = 1.0F / total;
+  for (float& p : probs) {
+    p *= scale;
+  }
+  return probs;
+}
+
+/// True when `QVAC_CLASSIFICATION_TRACE` is set and its first character is
+/// '1'.
+bool traceEnabled() {
+  const char* flag = std::getenv("QVAC_CLASSIFICATION_TRACE");
+  if (flag == nullptr) {
+    return false;
+  }
+  return flag[0] == '1';
+}
+
+} // namespace
+
+/// Initialises the CPU backend, loads weights and labels from `modelPath_`,
+/// builds the compute graph, and runs one warm-up forward pass. A call made
+/// after a successful load returns immediately.
+///
+/// Throws StatusError(InvalidArgument) when the model path is empty (or, on
+/// Android, when `backendsDir_` is empty) and StatusError(InternalError) when
+/// no CPU backend can be initialised. Anything thrown by graph::loadWeights
+/// or graph::buildGraph is not handled here.
+void ClassificationModel::load() {
+  std::scoped_lock lock(mutex_);
+  if (loaded_) {
+    return;
+  }
+  if (modelPath_.empty()) {
+    throw StatusError(
+        InvalidArgument,
+        "ClassificationModel requires a path to mobilenetv3 FP16 GGUF weights");
+  }
+
+#if defined(__ANDROID__)
+  // qvac-fabric on Android ships per-microarch CPU variants as MODULE
+  // .so files loaded at runtime via dlopen. ggml_backend_cpu_init() is
+  // not statically linkable here (symbol lives inside the variant .so),
+  // so we open the variants from <backendsDir>/<BACKENDS_SUBDIR>/ and
+  // pick a CPU device through the generic registry API.
+  //
+  // backendsDir comes from JS (`path.join(__dirname, 'prebuilds')`,
+  // mirroring the llamacpp-llm addon) and BACKENDS_SUBDIR is the
+  // compile-time `<bare_target>/<module_name>` relative path.
+  if (backendsDir_.empty()) {
+    throw StatusError(
+        InvalidArgument,
+        "Configuration 'config.backendsDir' is required on Android");
+  }
+  std::filesystem::path variantsDir =
+      std::filesystem::path(backendsDir_) / BACKENDS_SUBDIR;
+  ggml_backend_load_all_from_path(variantsDir.string().c_str());
+
+  ggml_backend_dev_t cpuDev =
+      ggml_backend_dev_by_type(GGML_BACKEND_DEVICE_TYPE_CPU);
+  if (cpuDev == nullptr) {
+    throw StatusError(
+        InternalError,
+        "No CPU backend device registered after loading variants from " +
+            variantsDir.string());
+  }
+  backend_ = ggml_backend_dev_init(cpuDev, /*params=*/nullptr);
+#else
+  backend_ = ggml_backend_cpu_init();
+#endif
+  // Shared failure check for both the Android and the static-CPU branch.
+  if (backend_ == nullptr) {
+    throw StatusError(InternalError, "Failed to initialize ggml CPU backend");
+  }
+
+  labels_.clear();
+  weights_ = graph::loadWeights(modelPath_, backend_, labels_);
+  // Use the default label set when loadWeights() produced no labels.
+  if (labels_.empty()) {
+    labels_ = {"food", "report", "other"};
+  }
+  compute_ = graph::buildGraph(weights_, backend_);
+
+  // One full forward pass at load() time. Without it, the first
+  // user-visible classify() can return NaN logits on win32-x64 CI
+  // because some backend allocator buffers are uninitialised after
+  // buildGraph() and CPU backends can JIT SIMD kernels on cold input.
+  // Symmetric with process(): set, compute, read back, discard.
+  {
+    constexpr uint32_t kWarmupSide = 32;
+    std::vector<uint8_t> warmupRgb(
+        static_cast<size_t>(kWarmupSide) * kWarmupSide * preprocess::kChannels);
+    // Deterministic synthetic byte pattern; the values carry no meaning.
+    for (size_t i = 0; i < warmupRgb.size(); ++i) {
+      warmupRgb[i] = static_cast<uint8_t>((i * 7) & 0xFFU);
+    }
+    std::vector<float> warmupTensor = preprocess::preprocessToTensor(
+        std::span<const uint8_t>(warmupRgb.data(), warmupRgb.size()),
+        kWarmupSide, kWarmupSide, preprocess::kChannels);
+    ggml_backend_tensor_set(
+        compute_.input, warmupTensor.data(), 0,
+        warmupTensor.size() * sizeof(float));
+    // The warm-up status is discarded; only process() treats a failed
+    // compute as an error.
+    (void)ggml_backend_graph_compute(backend_, compute_.graph);
+    float warmupLogits[graph::kNumClasses] = {0.0F};
+    ggml_backend_tensor_get(
+        compute_.output, warmupLogits, 0, sizeof(warmupLogits));
+    (void)warmupLogits;
+  }
+
+  loaded_ = true;
+
+  QLOG(
+      qvac_lib_inference_addon_cpp::logger::Priority::INFO,
+      std::string("ClassificationModel loaded (") +
+          std::to_string(labels_.size()) + " classes)");
+}
+
+/// Runs one classification job.
+///
+/// `input` must hold a `ClassifyInput`. The image is preprocessed into the
+/// network's input tensor, the graph is evaluated, the logits go through
+/// softmax, and the per-class results are returned as a `ClassifyOutput`
+/// sorted by confidence (highest first), truncated to `topK` when that is
+/// non-zero and smaller than the class count.
+///
+/// Throws StatusError(InvalidArgument) for a wrong payload type and
+/// StatusError(InternalError) when the model is not loaded, the preprocessed
+/// tensor has an unexpected size, or the graph computation fails. The elapsed
+/// time is recorded only when the call succeeds.
+std::any ClassificationModel::process(const std::any& input) {
+  const std::scoped_lock guard(mutex_);
+
+  const auto* request = std::any_cast<ClassifyInput>(&input);
+  if (request == nullptr) {
+    throw StatusError(InvalidArgument, "ClassificationModel: invalid input type");
+  }
+  if (!loaded_) {
+    throw StatusError(
+        InternalError,
+        "ClassificationModel: classify() called before load() or after unload()");
+  }
+
+  const auto startedAt = std::chrono::steady_clock::now();
+
+  // The preprocessor signals "encoded JPEG/PNG" with an all-zero dimension
+  // triplet, so an absent rawRgb collapses to zeros here.
+  uint32_t rawW = 0;
+  uint32_t rawH = 0;
+  uint32_t rawC = 0;
+  if (request->rawRgb.has_value()) {
+    rawW = request->rawRgb->width;
+    rawH = request->rawRgb->height;
+    rawC = request->rawRgb->channels;
+  }
+  std::vector<float> inputTensor = preprocess::preprocessToTensor(
+      std::span<const uint8_t>(request->data.data(), request->data.size()),
+      rawW, rawH, rawC);
+
+  const size_t expectedElems = static_cast<size_t>(preprocess::kInputSize) *
+                               preprocess::kInputSize * preprocess::kChannels;
+  if (inputTensor.size() != expectedElems) {
+    throw StatusError(
+        InternalError, "ClassificationModel: preprocessed tensor has wrong size");
+  }
+
+  // Upload, compute, read back.
+  ggml_backend_tensor_set(
+      compute_.input, inputTensor.data(), 0,
+      inputTensor.size() * sizeof(float));
+
+  const ggml_status status =
+      ggml_backend_graph_compute(backend_, compute_.graph);
+  if (status != GGML_STATUS_SUCCESS) {
+    throw StatusError(
+        InternalError, "ggml_backend_graph_compute failed with status " +
+                           std::to_string(static_cast<int>(status)));
+  }
+
+  float logits[graph::kNumClasses] = {0.0F};
+  ggml_backend_tensor_get(compute_.output, logits, 0, sizeof(logits));
+
+  const std::vector<float> probs =
+      softmax(std::span<const float>(logits, graph::kNumClasses));
+
+  ClassifyOutput output;
+  output.results.reserve(probs.size());
+  for (size_t i = 0; i < probs.size(); ++i) {
+    // Classes without a stored label get a synthetic "class_<index>" name.
+    std::string label = i < labels_.size()
+                            ? labels_[i]
+                            : std::string("class_") + std::to_string(i);
+    output.results.push_back(ClassifyResult{std::move(label), probs[i]});
+  }
+
+  // Non-finite confidences rank below every finite one and compare
+  // equivalent to each other, which keeps the ordering strict-weak even if a
+  // NaN/Inf ever gets past softmax.
+  std::sort(
+      output.results.begin(),
+      output.results.end(),
+      [](const ClassifyResult& lhs, const ClassifyResult& rhs) {
+        const bool lhsFinite = std::isfinite(lhs.confidence);
+        const bool rhsFinite = std::isfinite(rhs.confidence);
+        if (lhsFinite && rhsFinite) {
+          return lhs.confidence > rhs.confidence;
+        }
+        return lhsFinite && !rhsFinite;
+      });
+
+  if (traceEnabled()) {
+    // Placeholders used when fewer than three results exist.
+    const auto labelAt = [&output](size_t idx) -> const char* {
+      return idx < output.results.size() ? output.results[idx].label.c_str()
+                                         : "-";
+    };
+    const auto confidenceAt = [&output](size_t idx) -> double {
+      return idx < output.results.size()
+                 ? static_cast<double>(output.results[idx].confidence)
+                 : 0.0;
+    };
+    std::fprintf(
+        stderr,
+        "[qvac-classify] logits=[%.6f, %.6f, %.6f] "
+        "probs_before_sort=[%.6f, %.6f, %.6f] "
+        "sorted=[{%s:%.6f}, {%s:%.6f}, {%s:%.6f}]\n",
+        static_cast<double>(logits[0]),
+        static_cast<double>(logits[1]),
+        static_cast<double>(logits[2]),
+        static_cast<double>(probs[0]),
+        static_cast<double>(probs[1]),
+        static_cast<double>(probs[2]),
+        labelAt(0),
+        confidenceAt(0),
+        labelAt(1),
+        confidenceAt(1),
+        labelAt(2),
+        confidenceAt(2));
+    std::fflush(stderr);
+  }
+
+  // topK == 0 means "return everything".
+  if (request->topK > 0 && request->topK < output.results.size()) {
+    output.results.resize(request->topK);
+  }
+
+  const auto elapsed = std::chrono::steady_clock::now() - startedAt;
+  lastInferenceUs_ = static_cast<uint64_t>(
+      std::chrono::duration_cast<std::chrono::microseconds>(elapsed).count());
+
+  return std::any(std::move(output));
+}
+
+} // namespace classification_ggml
+
diff --git a/packages/classification-ggml/addon/src/model-interface/ClassificationModel.hpp b/packages/classification-ggml/addon/src/model-interface/ClassificationModel.hpp
new file mode 100644
index 0000000000..0c1004f480
--- /dev/null
+++ b/packages/classification-ggml/addon/src/model-interface/ClassificationModel.hpp
@@ -0,0 +1,80 @@
+#pragma once
+
+#include <any>
+#include <cstdint>
+#include <memory>
+#include <mutex>
+#include <optional>
+#include <span>
+#include <string>
+#include <variant>
+#include <vector>
+
+#include <ggml-backend.h>
+#include <inference-addon-cpp/ModelInterfaces.hpp>
+#include <inference-addon-cpp/RuntimeStats.hpp>
+
+#include "MobileNetGraph.hpp"
+
+namespace classification_ggml {
+
+/// Dimensions a caller declares for a raw (not encoded) pixel buffer.
+/// Members are zero-initialised so a default-constructed value never
+/// carries indeterminate dimensions; aggregate initialisation such as
+/// `RawRgbDims{w, h, c}` keeps working unchanged.
+struct RawRgbDims {
+  uint32_t width = 0;    // pixels per row
+  uint32_t height = 0;   // number of rows
+  uint32_t channels = 0; // interleaved channels per pixel
+};
+
+/// Raw classify input. `rawRgb` present = caller-supplied RGB bytes;
+/// absent = encoded JPEG/PNG, dimensions come from the decoder.
+struct ClassifyInput {
+  // Image bytes: either an encoded file or packed pixel data (see `rawRgb`).
+  std::vector<uint8_t> data;
+  // Declared shape of `data` when it holds raw pixels; empty for encoded input.
+  std::optional<RawRgbDims> rawRgb;
+  // Maximum number of results to keep. The result list is only truncated
+  // when this is non-zero and smaller than the number of results.
+  uint32_t topK = 0; // 0 = no topK filter
+};
+
+/// One (label, confidence) pair of a classification result.
+/// `confidence` is zero-initialised so a default-constructed result never
+/// exposes an indeterminate float; aggregate initialisation is unaffected.
+struct ClassifyResult {
+  std::string label;
+  float confidence = 0.0F;
+};
+
+/// Sorted by confidence descending.
+/// NOTE(review): the inference path visible in this change orders entries
+/// with a non-finite confidence after all finite ones — presumably that is
+/// ClassificationModel::process; confirm against the full function.
+struct ClassifyOutput {
+  std::vector<ClassifyResult> results;
+};
+
+/// MobileNetV3-Small 3-class classifier on libggml's CPU backend.
+///
+/// Implements the addon framework's `IModel` interface. Instances are
+/// non-copyable: they hold a raw `ggml_backend_t` handle together with the
+/// weight and compute-graph bundles.
+class ClassificationModel
+    : public qvac_lib_inference_addon_cpp::model::IModel {
+public:
+  /// Stores the path of the GGUF model file.
+  /// NOTE(review): presumably nothing is loaded until `load()` — confirm in
+  /// the .cpp.
+  explicit ClassificationModel(std::string modelPath);
+  ~ClassificationModel() override;
+
+  ClassificationModel(const ClassificationModel&) = delete;
+  ClassificationModel& operator=(const ClassificationModel&) = delete;
+
+  [[nodiscard]] std::string getName() const override;
+  /// Runs one classification.
+  /// NOTE(review): the input appears to wrap a `ClassifyInput` and the
+  /// returned `std::any` a `ClassifyOutput`; confirm against the .cpp.
+  std::any process(const std::any& input) override;
+  [[nodiscard]] qvac_lib_inference_addon_cpp::RuntimeStats
+  runtimeStats() const override;
+
+  /// Called from createInstance so load failures surface synchronously.
+  void load();
+
+  /// Optional addon-prebuilds root (e.g. `<addon>/prebuilds`). On Android
+  /// it's combined with the BACKENDS_SUBDIR compile-time relative path to
+  /// locate the per-microarch CPU variant .so files for ggml's runtime
+  /// backend loader. No-op on platforms where the CPU backend is static.
+  void setBackendsDir(std::string backendsDir);
+
+private:
+  std::string modelPath_;   // GGUF file path given to the constructor
+  std::string backendsDir_; // see setBackendsDir()
+  ggml_backend_t backend_ = nullptr;
+  // Declaration order matters: members are destroyed in reverse order, so
+  // `compute_` and `weights_` are released before the members above them.
+  graph::WeightsBundle weights_;
+  graph::ComputeGraph compute_;
+  std::vector<std::string> labels_;
+  bool loaded_ = false;
+  // Duration of the most recent inference in microseconds.
+  uint64_t lastInferenceUs_ = 0;
+  // `mutable` so const member functions can lock it.
+  // NOTE(review): which members it guards is not visible here — confirm.
+  mutable std::mutex mutex_;
+};
+
+} // namespace classification_ggml
diff --git a/packages/classification-ggml/addon/src/model-interface/ImagePreprocessor.cpp b/packages/classification-ggml/addon/src/model-interface/ImagePreprocessor.cpp
new file mode 100644
index 0000000000..a8c9452946
--- /dev/null
+++ b/packages/classification-ggml/addon/src/model-interface/ImagePreprocessor.cpp
@@ -0,0 +1,231 @@
+#include "ImagePreprocessor.hpp"
+
+#include <algorithm>
+#include <cstdlib>
+#include <limits>
+#include <stdexcept>
+#include <string>
+
+#include <inference-addon-cpp/Errors.hpp>
+
+// stb single-header implementations live here for the whole addon.
+#define STB_IMAGE_IMPLEMENTATION
+#define STB_IMAGE_RESIZE_IMPLEMENTATION
+#include <stb_image.h>
+#include <stb_image_resize2.h>
+
+namespace classification_ggml::preprocess {
+
+namespace {
+using qvac_errors::general_error::InvalidArgument;
+using qvac_errors::StatusError;
+
+constexpr size_t kDecodedChannels = 3;
+
+/// Throws a `StatusError` tagged `InvalidArgument` carrying `message`.
+/// Never returns; every preprocessing failure in this file goes through it.
+[[noreturn]] void raise(const std::string& message) {
+  throw StatusError(InvalidArgument, message);
+}
+
+/// Returns true when `buffer` begins with every byte of `prefix`, in order.
+/// A buffer shorter than the prefix never matches; an empty prefix always
+/// matches.
+bool startsWith(
+    std::span<const uint8_t> buffer, std::span<const uint8_t> prefix) {
+  return buffer.size() >= prefix.size() &&
+         std::equal(prefix.begin(), prefix.end(), buffer.begin());
+}
+} // namespace
+
+/// Reports whether `buffer` opens with the signature bytes of one of the
+/// two supported container formats (JPEG or PNG). Only the leading bytes
+/// are inspected; the rest of the buffer is not validated.
+bool isEncodedImage(std::span<const uint8_t> buffer) {
+  // JPEG start-of-image marker followed by the first marker byte.
+  constexpr std::array<uint8_t, 3> kJpegSignature = {0xFF, 0xD8, 0xFF};
+  // Fixed 8-byte PNG file signature.
+  constexpr std::array<uint8_t, 8> kPngSignature = {
+      0x89, 0x50, 0x4E, 0x47, 0x0D, 0x0A, 0x1A, 0x0A};
+
+  if (startsWith(buffer, kJpegSignature)) {
+    return true;
+  }
+  return startsWith(buffer, kPngSignature);
+}
+
+/// Decodes an encoded image into packed 3-channel RGB bytes.
+///
+/// @param encodedBuffer  bytes of the encoded image; must be non-empty and
+///                       no larger than INT_MAX bytes (stb takes an `int`).
+/// @param outWidth       receives the decoded width; written on success only.
+/// @param outHeight      receives the decoded height; written on success only.
+/// @return `width * height * 3` bytes, row-major, interleaved RGB.
+/// @throws StatusError(InvalidArgument) on empty/oversized input, decode
+///         failure, or dimensions outside (0, kMaxImageDimension].
+std::vector<uint8_t> decodeToRgb(
+    std::span<const uint8_t> encodedBuffer, uint32_t& outWidth,
+    uint32_t& outHeight) {
+  if (encodedBuffer.empty()) {
+    raise("Input image buffer is empty");
+  }
+  if (encodedBuffer.size() >
+      static_cast<size_t>(std::numeric_limits<int>::max())) {
+    raise("Input image buffer too large for decoder");
+  }
+
+  // Header-only inspection so we can reject oversized images before
+  // stbi_load allocates the full RGB buffer (~300 MB for 100 MP).
+  // stbi_info returning 0 = header unparseable; defer to stbi_load
+  // below so the caller gets stbi_failure_reason() instead of a
+  // generic "header bad" from us.
+  {
+    int infoWidth = 0;
+    int infoHeight = 0;
+    int infoChannels = 0;
+    if (stbi_info_from_memory(
+            encodedBuffer.data(), static_cast<int>(encodedBuffer.size()),
+            &infoWidth, &infoHeight, &infoChannels) != 0) {
+      if (infoWidth <= 0 || infoHeight <= 0) {
+        raise("Decoded image has invalid dimensions");
+      }
+      if (static_cast<uint32_t>(infoWidth) > kMaxImageDimension ||
+          static_cast<uint32_t>(infoHeight) > kMaxImageDimension) {
+        raise(
+            "Image exceeds maximum allowed dimension (" +
+            std::to_string(kMaxImageDimension) + " px per axis); header "
+            "reported " + std::to_string(infoWidth) + "x" +
+            std::to_string(infoHeight));
+      }
+    }
+  }
+
+  int width = 0;
+  int height = 0;
+  int channelsIgnored = 0;
+  // Force 3 output channels — downstream never deals with alpha/grayscale.
+  uint8_t* pixels = stbi_load_from_memory(
+      encodedBuffer.data(), static_cast<int>(encodedBuffer.size()), &width,
+      &height, &channelsIgnored, static_cast<int>(kDecodedChannels));
+
+  if (pixels == nullptr) {
+    const char* reason = stbi_failure_reason();
+    std::string msg = "Failed to decode image (only JPEG and PNG are supported)";
+    if (reason != nullptr) {
+      msg += ": ";
+      msg += reason;
+    }
+    raise(msg);
+  }
+
+  // Scope guard: the stb allocation is released on every exit path from
+  // here on, including when building an error message or copying into the
+  // output vector throws (e.g. std::bad_alloc), which previously leaked it.
+  struct StbPixelGuard {
+    explicit StbPixelGuard(uint8_t* owned) : ptr(owned) {}
+    ~StbPixelGuard() { stbi_image_free(ptr); }
+    StbPixelGuard(const StbPixelGuard&) = delete;
+    StbPixelGuard& operator=(const StbPixelGuard&) = delete;
+    uint8_t* ptr;
+  };
+  const StbPixelGuard pixelGuard(pixels);
+
+  if (width <= 0 || height <= 0) {
+    raise("Decoded image has invalid dimensions");
+  }
+  // Re-check after decoding: the header probe above is skipped when
+  // stbi_info cannot parse the header.
+  if (static_cast<uint32_t>(width) > kMaxImageDimension ||
+      static_cast<uint32_t>(height) > kMaxImageDimension) {
+    raise(
+        "Image exceeds maximum allowed dimension (" +
+        std::to_string(kMaxImageDimension) + " px per axis)");
+  }
+
+  const size_t byteCount = static_cast<size_t>(width) *
+                           static_cast<size_t>(height) * kDecodedChannels;
+  std::vector<uint8_t> out(pixels, pixels + byteCount);
+
+  outWidth = static_cast<uint32_t>(width);
+  outHeight = static_cast<uint32_t>(height);
+  return out;
+}
+
+/// Checks that a caller-supplied raw pixel buffer is consistent with the
+/// shape it was declared with. Returns normally when everything matches;
+/// otherwise throws StatusError(InvalidArgument). Checks run in this order:
+/// non-empty buffer, channel count, non-zero dimensions, per-axis limit,
+/// exact byte count.
+void validateRawRgb(
+    std::span<const uint8_t> rawBuffer, uint32_t width, uint32_t height,
+    uint32_t channels) {
+  if (rawBuffer.empty()) {
+    raise("Raw image buffer is empty");
+  }
+
+  if (channels != kChannels) {
+    std::string msg = "Raw image must have exactly 3 channels (RGB); got ";
+    msg += std::to_string(channels);
+    raise(msg);
+  }
+
+  const bool hasArea = width != 0 && height != 0;
+  if (!hasArea) {
+    raise("Raw image width and height must be greater than zero");
+  }
+
+  const bool withinLimit =
+      width <= kMaxImageDimension && height <= kMaxImageDimension;
+  if (!withinLimit) {
+    std::string msg = "Raw image exceeds maximum allowed dimension (";
+    msg += std::to_string(kMaxImageDimension);
+    msg += " px per axis)";
+    raise(msg);
+  }
+
+  // Widen before multiplying so the byte count is computed in size_t.
+  size_t requiredBytes = static_cast<size_t>(width);
+  requiredBytes *= static_cast<size_t>(height);
+  requiredBytes *= static_cast<size_t>(channels);
+  if (rawBuffer.size() == requiredBytes) {
+    return;
+  }
+
+  std::string msg = "Raw image buffer size ";
+  msg += std::to_string(rawBuffer.size());
+  msg += " does not match declared dimensions ";
+  msg += std::to_string(width);
+  msg += "x";
+  msg += std::to_string(height);
+  msg += "x";
+  msg += std::to_string(channels);
+  msg += " (expected ";
+  msg += std::to_string(requiredBytes);
+  msg += " bytes)";
+  raise(msg);
+}
+
+/// Resizes packed RGB pixels to the model's `kInputSize` x `kInputSize`
+/// input using stb_image_resize2's linear uint8 resizer.
+///
+/// @param srcRgb     interleaved RGB bytes; must hold at least
+///                   `srcWidth * srcHeight * kChannels` bytes.
+/// @param srcWidth   source width in pixels (> 0).
+/// @param srcHeight  source height in pixels (> 0).
+/// @return `kInputSize * kInputSize * kChannels` bytes of interleaved RGB.
+/// @throws StatusError(InvalidArgument) when the arguments are inconsistent
+///         or the resizer reports failure.
+std::vector<uint8_t> resizeToInput(
+    std::span<const uint8_t> srcRgb, uint32_t srcWidth, uint32_t srcHeight) {
+  if (srcWidth == 0 || srcHeight == 0) {
+    raise("Cannot resize image: width and height must be greater than zero");
+  }
+  // stb takes `int` dimensions and an `int` row stride; reject values the
+  // casts below could not represent.
+  constexpr uint32_t kIntMax =
+      static_cast<uint32_t>(std::numeric_limits<int>::max());
+  if (srcWidth > kIntMax / kChannels || srcHeight > kIntMax) {
+    raise("Cannot resize image: dimensions too large for the resizer");
+  }
+  // The resizer reads width*height*channels bytes; a shorter buffer would
+  // be read out of bounds. 64-bit math cannot overflow given the caps above.
+  const uint64_t requiredBytes = static_cast<uint64_t>(srcWidth) *
+                                 static_cast<uint64_t>(srcHeight) * kChannels;
+  if (srcRgb.size() < requiredBytes) {
+    raise(
+        "Cannot resize image: buffer holds " + std::to_string(srcRgb.size()) +
+        " bytes but " + std::to_string(srcWidth) + "x" +
+        std::to_string(srcHeight) + "x" + std::to_string(kChannels) +
+        " requires " + std::to_string(requiredBytes));
+  }
+
+  std::vector<uint8_t> out(kInputSize * kInputSize * kChannels);
+  unsigned char* ok = stbir_resize_uint8_linear(
+      srcRgb.data(), static_cast<int>(srcWidth), static_cast<int>(srcHeight),
+      static_cast<int>(srcWidth * kChannels), out.data(),
+      static_cast<int>(kInputSize), static_cast<int>(kInputSize),
+      static_cast<int>(kInputSize * kChannels), STBIR_RGB);
+  if (ok == nullptr) {
+    raise("Failed to resize image to 224x224");
+  }
+  return out;
+}
+
+/// Converts an interleaved `kInputSize` x `kInputSize` RGB image into a
+/// planar FP32 buffer. Each byte is scaled by 1/255, then the channel's
+/// ImageNet mean is subtracted and the result divided by the channel's
+/// ImageNet standard deviation.
+///
+/// Throws StatusError(InvalidArgument) when the input is not exactly
+/// `kInputSize * kInputSize * kChannels` bytes.
+std::vector<float> normalizeToWhcn(std::span<const uint8_t> rgb224) {
+  constexpr size_t kPlaneSize = static_cast<size_t>(kInputSize) * kInputSize;
+  constexpr size_t kTotalSize = kPlaneSize * kChannels;
+  if (rgb224.size() != kTotalSize) {
+    raise("Internal error: resized buffer does not have expected size");
+  }
+  constexpr float kByteToUnit = 1.0F / 255.0F;
+
+  // Source is pixel-interleaved (R,G,B,R,G,B,...). Destination is planar:
+  // offset(w, h, c) = c*H*W + h*W + w, so the row-major pixel index `px`
+  // (= h*W + w) is also the offset inside each channel plane.
+  std::vector<float> planar(kTotalSize);
+  for (size_t px = 0; px < kPlaneSize; ++px) {
+    const uint8_t* texel = rgb224.data() + px * kChannels;
+    for (size_t ch = 0; ch < kChannels; ++ch) {
+      const float unit = static_cast<float>(texel[ch]) * kByteToUnit;
+      planar[ch * kPlaneSize + px] =
+          (unit - kImageNetMean[ch]) / kImageNetStd[ch];
+    }
+  }
+  return planar;
+}
+
+/// Full preprocessing pipeline: turns an input buffer into the normalized
+/// FP32 tensor consumed by the model.
+///
+/// If any of the declared dimensions is non-zero the buffer is treated as
+/// raw pixels and validated against that shape. Otherwise it must start
+/// with JPEG or PNG magic bytes and is decoded.
+///
+/// @throws StatusError(InvalidArgument) on empty input, an invalid raw
+///         shape, an unsupported format, or a decode/resize failure.
+std::vector<float> preprocessToTensor(
+    std::span<const uint8_t> input, uint32_t declaredWidth,
+    uint32_t declaredHeight, uint32_t declaredChannels) {
+  if (input.empty()) {
+    raise("Input image buffer is empty");
+  }
+
+  if (declaredWidth > 0 || declaredHeight > 0 || declaredChannels > 0) {
+    validateRawRgb(input, declaredWidth, declaredHeight, declaredChannels);
+    // Resize straight from the caller's bytes: the resizer only reads its
+    // source, so copying the whole raw buffer first was wasted memory.
+    const std::vector<uint8_t> resized =
+        resizeToInput(input, declaredWidth, declaredHeight);
+    return normalizeToWhcn(resized);
+  }
+
+  if (!isEncodedImage(input)) {
+    raise(
+        "Unsupported image format: expected JPEG or PNG, or pass "
+        "'{ width, height, channels: 3 }' with raw RGB bytes");
+  }
+
+  uint32_t width = 0;
+  uint32_t height = 0;
+  const std::vector<uint8_t> rgb = decodeToRgb(input, width, height);
+  const std::vector<uint8_t> resized = resizeToInput(rgb, width, height);
+  return normalizeToWhcn(resized);
+}
+
+} // namespace classification_ggml::preprocess
diff --git a/packages/classification-ggml/addon/src/model-interface/ImagePreprocessor.hpp b/packages/classification-ggml/addon/src/model-interface/ImagePreprocessor.hpp
new file mode 100644
index 0000000000..ba76331477
--- /dev/null
+++ b/packages/classification-ggml/addon/src/model-interface/ImagePreprocessor.hpp
@@ -0,0 +1,45 @@
+#pragma once
+
+#include <array>
+#include <cstdint>
+#include <span>
+#include <vector>
+
+namespace classification_ggml::preprocess {
+
+constexpr uint32_t kInputSize = 224;
+constexpr uint32_t kChannels = 3;
+/// OOM defence — reject inputs larger than this on either axis.
+constexpr uint32_t kMaxImageDimension = 16384;
+
+/// ImageNet per-channel normalization, matching torchvision's MobileNetV3.
+constexpr std::array<float, 3> kImageNetMean = {0.485F, 0.456F, 0.406F};
+constexpr std::array<float, 3> kImageNetStd = {0.229F, 0.224F, 0.225F};
+
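+/// True when `buffer` starts with JPEG or PNG magic bytes. Callers use a
+/// false result to treat the buffer as not-encoded; `preprocessToTensor`
+/// rejects such a buffer unless raw dimensions were declared.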
+bool isEncodedImage(std::span<const uint8_t> buffer);
+
+/// Decode JPEG/PNG to packed RGB. Throws StatusError on any failure.
+std::vector<uint8_t> decodeToRgb(
+    std::span<const uint8_t> encodedBuffer, uint32_t& outWidth,
+    uint32_t& outHeight);
+
+/// Throws StatusError if the buffer doesn't match the declared shape,
+/// channels != 3, or dimensions exceed `kMaxImageDimension`.
+void validateRawRgb(
+    std::span<const uint8_t> rawBuffer, uint32_t width, uint32_t height,
+    uint32_t channels);
+
+/// Bilinear resize (stb_image_resize2) to `kInputSize` square.
+std::vector<uint8_t> resizeToInput(
+    std::span<const uint8_t> srcRgb, uint32_t srcWidth, uint32_t srcHeight);
+
+/// `kInputSize` × `kInputSize` RGB → FP32 WHCN tensor, ImageNet-normalized.
+std::vector<float> normalizeToWhcn(std::span<const uint8_t> rgb224);
+
+/// Full pipeline: encoded-or-raw buffer → FP32 WHCN tensor.
+std::vector<float> preprocessToTensor(
+    std::span<const uint8_t> input, uint32_t declaredWidth,
+    uint32_t declaredHeight, uint32_t declaredChannels);
+
+} // namespace classification_ggml::preprocess
diff --git a/packages/classification-ggml/addon/src/model-interface/MobileNetGraph.cpp b/packages/classification-ggml/addon/src/model-interface/MobileNetGraph.cpp
new file mode 100644
index 0000000000..9eaf3009b0
--- /dev/null
+++ b/packages/classification-ggml/addon/src/model-interface/MobileNetGraph.cpp
@@ -0,0 +1,644 @@
+#include "MobileNetGraph.hpp"
+
+#include <algorithm>
+#include <cmath>
+#include <cstdint>
+#include <cstring>
+#include <memory>
+#include <stdexcept>
+#include <string>
+#include <unordered_map>
+#include <vector>
+
+#include <ggml-alloc.h>
+#include <ggml-backend.h>
+#include <ggml.h>
+#include <gguf.h>
+
+#include <inference-addon-cpp/Errors.hpp>
+
+namespace classification_ggml::graph {
+
+namespace {
+
+using qvac_errors::StatusError;
+using qvac_errors::general_error::InternalError;
+using qvac_errors::general_error::InvalidArgument;
+
+/// Throws a `StatusError` tagged `InternalError` carrying `msg`.
+/// Never returns.
+[[noreturn]] void raise(const std::string& msg) {
+  throw StatusError(InternalError, msg);
+}
+
+/// Throws a `StatusError` tagged `InvalidArgument` carrying `msg`; used for
+/// problems with the supplied model file. Never returns.
+[[noreturn]] void raiseInvalid(const std::string& msg) {
+  throw StatusError(InvalidArgument, msg);
+}
+
+// FP16 tensors are storage-only; runtime-math tensors (BN scale/shift,
+// FC weights) are promoted to F32 at load time so the graph never casts.
+
+/// Widens `count` half-precision values starting at `src` into `out`.
+/// `src` is reinterpreted as an array of `ggml_fp16_t`; `out` must have
+/// room for `count` floats.
+void fp16ToFp32(const void* src, float* out, size_t count) {
+  const auto* first = static_cast<const ggml_fp16_t*>(src);
+  std::transform(first, first + count, out, [](ggml_fp16_t half) {
+    return ggml_fp16_to_fp32(half);
+  });
+}
+
+/// Creates, in `bundleCtx`, a tensor with the same dtype and shape as the
+/// GGUF tensor `name` and gives it the same name. No data is copied here.
+/// Raises InternalError when the tensor is absent from the GGUF index or
+/// cannot be resolved from `ggufCtx`.
+struct ggml_tensor* cloneRaw(
+    struct ggml_context* bundleCtx, const gguf_context* gguf,
+    struct ggml_context* ggufCtx, const char* name) {
+  const int tensorIndex = gguf_find_tensor(gguf, name);
+  if (tensorIndex < 0) {
+    raise(std::string("Missing tensor in GGUF: ") + name);
+  }
+
+  struct ggml_tensor* const source = ggml_get_tensor(ggufCtx, name);
+  if (source == nullptr) {
+    raise(std::string("Cannot resolve tensor from ggml ctx: ") + name);
+  }
+
+  struct ggml_tensor* const clone = ggml_new_tensor(
+      bundleCtx, source->type, ggml_n_dims(source), source->ne);
+  ggml_set_name(clone, name);
+  return clone;
+}
+
+/// Creates an F32 tensor named `name` in `bundleCtx` with the caller-given
+/// rank and extents. Unlike cloneRaw, nothing is looked up in the GGUF.
+struct ggml_tensor* cloneAsFp32(
+    struct ggml_context* bundleCtx, const char* name, int n_dims,
+    const int64_t* ne) {
+  struct ggml_tensor* const created =
+      ggml_new_tensor(bundleCtx, GGML_TYPE_F32, n_dims, ne);
+  ggml_set_name(created, name);
+  return created;
+}
+
+// torchvision same-padding: p = (k - 1) / 2.
+// Integer division, so kernel 1 -> 0, kernel 3 -> 1, kernel 5 -> 2.
+constexpr int samePadding(int kernel) {
+  return (kernel - 1) / 2;
+}
+
+/// Read a GGUF tensor (FP16 or FP32) into an FP32 vector.
+///
+/// All elements are returned flattened in storage order, whatever the
+/// tensor's rank. Besides BN parameters this also loads SE biases and
+/// classifier tensors, so the error messages name the tensor generically
+/// instead of calling everything a "BN tensor".
+///
+/// @param gguf     unused; kept so existing call sites stay unchanged.
+/// @param ggufCtx  ggml context holding the GGUF tensors with their data.
+/// @param name     tensor name to read.
+/// @throws StatusError(InternalError) when the tensor is missing or its
+///         dtype is neither F32 nor F16.
+std::vector<float> loadVector1d(
+    const gguf_context* gguf, struct ggml_context* ggufCtx,
+    const std::string& name) {
+  (void)gguf;
+  struct ggml_tensor* t = ggml_get_tensor(ggufCtx, name.c_str());
+  if (t == nullptr) {
+    raise("Missing tensor in GGUF: " + name);
+  }
+  const size_t count = ggml_nelements(t);
+  std::vector<float> out(count);
+  if (t->type == GGML_TYPE_F32) {
+    std::memcpy(out.data(), t->data, count * sizeof(float));
+  } else if (t->type == GGML_TYPE_F16) {
+    fp16ToFp32(t->data, out.data(), count);
+  } else {
+    raise("Unsupported tensor dtype (expected F32 or F16) for: " + name);
+  }
+  return out;
+}
+
+/// Applies a batch norm that was folded into a per-channel affine
+/// transform: returns `x * scale + shift`. `scale` and `shift` are expected
+/// to be pre-reshaped to [1,1,C,1].
+struct ggml_tensor* applyFoldedBn(
+    struct ggml_context* ctx, struct ggml_tensor* x,
+    struct ggml_tensor* scale, struct ggml_tensor* shift) {
+  return ggml_add(ctx, ggml_mul(ctx, x, scale), shift);
+}
+
+/// Assembles the MobileNetV3 forward pass from ggml ops. Every weight is
+/// resolved by name from the map `w`; every op tensor is created in `ctx`.
+struct GraphBuilder {
+  struct ggml_context* ctx;
+  const std::unordered_map<std::string, struct ggml_tensor*>& w;
+
+  /// Returns the weight tensor registered under `name`; raises
+  /// InternalError when no such tensor exists.
+  struct ggml_tensor* t(const std::string& name) const {
+    const auto found = w.find(name);
+    if (found != w.end()) {
+      return found->second;
+    }
+    raise("Missing weight tensor at graph build time: " + name);
+  }
+
+  /// Hardswish when `useHardswish` is set, ReLU otherwise.
+  struct ggml_tensor* activate(struct ggml_tensor* x, bool useHardswish) {
+    if (useHardswish) {
+      return ggml_hardswish(ctx, x);
+    }
+    return ggml_relu(ctx, x);
+  }
+
+  /// Regular convolution (square stride, same-padding, dilation 1), then
+  /// folded BN, then the activation if `activate` is true.
+  struct ggml_tensor* convBnAct(
+      struct ggml_tensor* x, const std::string& convPrefix,
+      const std::string& bnPrefix, int stride, int kernel, bool activate,
+      bool useHardswish) {
+    struct ggml_tensor* filter = t(convPrefix + ".weight");
+    const int padding = samePadding(kernel);
+    struct ggml_tensor* convOut = ggml_conv_2d(
+        ctx, filter, x, stride, stride, padding, padding, 1, 1);
+    struct ggml_tensor* bnScale = t(bnPrefix + ".scale");
+    struct ggml_tensor* bnShift = t(bnPrefix + ".shift");
+    struct ggml_tensor* normed = applyFoldedBn(ctx, convOut, bnScale, bnShift);
+    // The parameter `activate` shadows the member function, hence `this->`.
+    return activate ? this->activate(normed, useHardswish) : normed;
+  }
+
+  /// Depthwise convolution (same-padding, dilation 1), then folded BN, then
+  /// the activation (always applied).
+  struct ggml_tensor* dwConvBnAct(
+      struct ggml_tensor* x, const std::string& convPrefix,
+      const std::string& bnPrefix, int stride, int kernel, bool useHardswish) {
+    struct ggml_tensor* filter = t(convPrefix + ".weight");
+    const int padding = samePadding(kernel);
+    struct ggml_tensor* convOut = ggml_conv_2d_dw(
+        ctx, filter, x, stride, stride, padding, padding, 1, 1);
+    struct ggml_tensor* bnScale = t(bnPrefix + ".scale");
+    struct ggml_tensor* bnShift = t(bnPrefix + ".shift");
+    return activate(
+        applyFoldedBn(ctx, convOut, bnScale, bnShift), useHardswish);
+  }
+
+  /// Squeeze-and-excitation: average-pool over a `spatialHw` window, 1x1
+  /// reduce + bias + ReLU, 1x1 expand + bias + HardSigmoid, then multiply
+  /// the input by the resulting gate.
+  struct ggml_tensor* seBlock(
+      struct ggml_tensor* x, const std::string& sePrefix, int spatialHw) {
+    // Kernel and stride both equal the spatial size, no padding.
+    struct ggml_tensor* squeezed = ggml_pool_2d(
+        ctx, x, GGML_OP_POOL_AVG, spatialHw, spatialHw, spatialHw, spatialHw,
+        0, 0);
+
+    struct ggml_tensor* reduced = ggml_conv_2d(
+        ctx, t(sePrefix + ".fc1.weight"), squeezed, 1, 1, 0, 0, 1, 1);
+    reduced = ggml_add(ctx, reduced, t(sePrefix + ".fc1.bias_br"));
+    reduced = ggml_relu(ctx, reduced);
+
+    struct ggml_tensor* expanded = ggml_conv_2d(
+        ctx, t(sePrefix + ".fc2.weight"), reduced, 1, 1, 0, 0, 1, 1);
+    expanded = ggml_add(ctx, expanded, t(sePrefix + ".fc2.bias_br"));
+
+    return ggml_mul(ctx, x, ggml_hardsigmoid(ctx, expanded));
+  }
+
+  /// One inverted-residual block: optional 1x1 expand, depthwise conv,
+  /// optional SE, 1x1 projection without activation, and a skip connection
+  /// when stride is 1 and input/output channel counts match.
+  struct ggml_tensor* invertedResidual(
+      struct ggml_tensor* x, const BlockConfig& cfg, int inputSpatialHw) {
+    const std::string base = "features." + std::to_string(cfg.featuresIndex);
+    const auto subBlock = [&base](int index) {
+      return base + ".block." + std::to_string(index);
+    };
+
+    // Sub-block numbering shifts by one when the expand conv is present and
+    // by one more when an SE block sits between depthwise and projection.
+    const bool hasExpand = cfg.expandedChannels != cfg.inputChannels;
+    const int dwBlockIdx = hasExpand ? 1 : 0;
+    const int seBlockIdx = cfg.useSe ? dwBlockIdx + 1 : -1;
+    const int projBlockIdx = dwBlockIdx + (cfg.useSe ? 2 : 1);
+
+    struct ggml_tensor* y = x;
+    if (hasExpand) {
+      y = convBnAct(
+          y, base + ".block.0.0", base + ".block.0.1",
+          /*stride=*/1, /*kernel=*/1, /*activate=*/true, cfg.useHardswish);
+    }
+
+    const std::string dwPrefix = subBlock(dwBlockIdx);
+    y = dwConvBnAct(
+        y, dwPrefix + ".0", dwPrefix + ".1", cfg.stride, cfg.depthwiseKernel,
+        cfg.useHardswish);
+    // A stride-2 depthwise conv halves the spatial size (rounding up).
+    const int spatial =
+        cfg.stride == 2 ? (inputSpatialHw + 1) / 2 : inputSpatialHw;
+
+    if (cfg.useSe) {
+      y = seBlock(y, subBlock(seBlockIdx), spatial);
+    }
+
+    const std::string projPrefix = subBlock(projBlockIdx);
+    y = convBnAct(
+        y, projPrefix + ".0", projPrefix + ".1",
+        /*stride=*/1, /*kernel=*/1, /*activate=*/false, cfg.useHardswish);
+
+    const bool hasSkip =
+        cfg.stride == 1 && cfg.inputChannels == cfg.outputChannels;
+    return hasSkip ? ggml_add(ctx, y, x) : y;
+  }
+};
+
+} // namespace
+
+// Releases the tensor map, the ggml context and the backend buffer.
+WeightsBundle::~WeightsBundle() { reset(); }
+
+// Move constructor: takes over the context, the tensor map and the backend
+// buffer handle from `other`.
+WeightsBundle::WeightsBundle(WeightsBundle&& other) noexcept
+    : ctx(std::move(other.ctx)),
+      tensors(std::move(other.tensors)),
+      backendBuffer(other.backendBuffer) {
+  // The raw handle is not cleared by the copy above; null it so `other`'s
+  // destructor does not free the buffer this object now owns.
+  other.backendBuffer = nullptr;
+}
+
+// Move assignment: frees whatever this bundle currently owns, then takes
+// over `other`'s context, tensor map and backend buffer. Self-assignment
+// is a no-op.
+WeightsBundle& WeightsBundle::operator=(WeightsBundle&& other) noexcept {
+  if (this == &other) {
+    return *this;
+  }
+  reset();
+  ctx = std::move(other.ctx);
+  tensors = std::move(other.tensors);
+  backendBuffer = other.backendBuffer;
+  // Leave `other` without a buffer so it cannot free the one we now own.
+  other.backendBuffer = nullptr;
+  return *this;
+}
+
+// Drops every owned resource: the name->tensor map first, then the ggml
+// context, and finally the backend buffer if one was allocated. Safe to
+// call repeatedly.
+void WeightsBundle::reset() {
+  tensors.clear();
+  ctx.reset();
+  if (backendBuffer == nullptr) {
+    return;
+  }
+  ggml_backend_buffer_free(backendBuffer);
+  backendBuffer = nullptr;
+}
+
+// Releases the ggml context and the backend buffer.
+ComputeGraph::~ComputeGraph() { reset(); }
+
+// Move constructor: takes over the context, the graph/input/output
+// pointers and the backend buffer handle from `other`.
+ComputeGraph::ComputeGraph(ComputeGraph&& other) noexcept
+    : ctx(std::move(other.ctx)),
+      graph(other.graph),
+      input(other.input),
+      output(other.output),
+      backendBuffer(other.backendBuffer) {
+  // Raw pointers are merely copied above; clear them in `other` so it
+  // neither frees the buffer nor exposes pointers it no longer owns.
+  other.graph = nullptr;
+  other.input = nullptr;
+  other.output = nullptr;
+  other.backendBuffer = nullptr;
+}
+
+// Move assignment: frees whatever this graph currently owns, then takes
+// over everything from `other` and leaves `other` empty. Self-assignment
+// is a no-op.
+ComputeGraph& ComputeGraph::operator=(ComputeGraph&& other) noexcept {
+  if (this == &other) {
+    return *this;
+  }
+  reset();
+
+  ctx = std::move(other.ctx);
+
+  graph = other.graph;
+  other.graph = nullptr;
+
+  input = other.input;
+  other.input = nullptr;
+
+  output = other.output;
+  other.output = nullptr;
+
+  backendBuffer = other.backendBuffer;
+  other.backendBuffer = nullptr;
+
+  return *this;
+}
+
+// Clears the graph/input/output pointers, releases the ggml context, and
+// frees the backend buffer if one was allocated. Safe to call repeatedly.
+void ComputeGraph::reset() {
+  output = nullptr;
+  input = nullptr;
+  graph = nullptr;
+  ctx.reset();
+  if (backendBuffer == nullptr) {
+    return;
+  }
+  ggml_backend_buffer_free(backendBuffer);
+  backendBuffer = nullptr;
+}
+
+/// Loads the MobileNetV3-Small weights from a GGUF file into a buffer on
+/// `backend` and returns the bundle of named tensors.
+///
+/// Convolution kernels and raw SE biases are copied byte-for-byte. Batch
+/// norm parameters are folded into per-channel `.scale` / `.shift` F32
+/// tensors, SE biases get an extra F32 `_br` broadcast copy, and the
+/// classifier tensors are promoted to F32.
+///
+/// @param ggufPath   path of the GGUF model file.
+/// @param backend    ggml backend that receives the weight buffer.
+/// @param outLabels  cleared, then filled from `mobilenet.class_<i>`; left
+///                   empty when any of those keys is missing.
+/// @throws StatusError(InvalidArgument) when the file cannot be opened or
+///         its metadata is inconsistent with this build.
+/// @throws StatusError(InternalError) on missing tensors, dtype or size
+///         mismatches, or allocation failure.
+WeightsBundle loadWeights(
+    const std::string& ggufPath, ggml_backend_t backend,
+    std::vector<std::string>& outLabels) {
+  outLabels.clear();
+  struct ggml_context* ggufCtx = nullptr;
+  gguf_init_params params{/*no_alloc=*/false, &ggufCtx};
+  gguf_context* gguf = gguf_init_from_file(ggufPath.c_str(), params);
+  if (gguf == nullptr) {
+    raiseInvalid("Failed to open GGUF file: " + ggufPath);
+  }
+  std::unique_ptr<gguf_context, decltype(&gguf_free)> ggufGuard(gguf, gguf_free);
+  std::unique_ptr<struct ggml_context, decltype(&ggml_free)> ggufCtxGuard(
+      ggufCtx, ggml_free);
+
+  // The gguf_get_val_* accessors assert on the stored value type, so a
+  // malformed model file would abort the whole process. Check the type
+  // first and report it as an invalid model instead.
+  auto requireKvType = [&](int64_t keyIdx, enum gguf_type expected,
+                           const std::string& key, const char* expectedName) {
+    if (gguf_get_kv_type(gguf, static_cast<int>(keyIdx)) != expected) {
+      raiseInvalid(
+          "GGUF metadata '" + key + "' has the wrong value type (expected " +
+          expectedName + ")");
+    }
+  };
+
+  // Default to 0.001, the epsilon torchvision's MobileNetV3 configures for
+  // its BatchNorm layers. Never silently fall back to PyTorch's generic
+  // BatchNorm default of 1e-5.
+  float bnEps = kBatchNormEpsilon;
+  {
+    const int64_t epsIdx = gguf_find_key(gguf, "mobilenet.bn_eps");
+    if (epsIdx >= 0) {
+      requireKvType(epsIdx, GGUF_TYPE_FLOAT32, "mobilenet.bn_eps", "float32");
+      bnEps = gguf_get_val_f32(gguf, static_cast<int>(epsIdx));
+      // A NaN, infinite or negative epsilon would poison every folded scale.
+      if (!std::isfinite(bnEps) || bnEps < 0.0F) {
+        raiseInvalid(
+            "GGUF metadata 'mobilenet.bn_eps' must be a finite, non-negative "
+            "value; got " + std::to_string(bnEps));
+      }
+    }
+  }
+
+  {
+    uint32_t numClasses = kNumClasses;
+    const int64_t idxN = gguf_find_key(gguf, "mobilenet.num_classes");
+    if (idxN >= 0) {
+      requireKvType(idxN, GGUF_TYPE_UINT32, "mobilenet.num_classes", "uint32");
+      numClasses = gguf_get_val_u32(gguf, static_cast<int>(idxN));
+    }
+    // Mismatch silently corrupts the classifier upload and the per-call
+    // tensor_get; reject up front.
+    if (numClasses != kNumClasses) {
+      raiseInvalid(
+          "GGUF metadata 'mobilenet.num_classes' (" +
+          std::to_string(numClasses) +
+          ") does not match the addon's compiled-in class count (" +
+          std::to_string(kNumClasses) +
+          "); rebuild @qvac/classification-ggml against this model or use "
+          "a GGUF with the expected number of classes");
+    }
+    for (uint32_t i = 0; i < numClasses; ++i) {
+      const std::string key = "mobilenet.class_" + std::to_string(i);
+      const int64_t idx = gguf_find_key(gguf, key.c_str());
+      if (idx < 0) {
+        // Labels are all-or-nothing: one missing key discards the lot.
+        outLabels.clear();
+        break;
+      }
+      requireKvType(idx, GGUF_TYPE_STRING, key, "string");
+      outLabels.emplace_back(gguf_get_val_str(gguf, static_cast<int>(idx)));
+    }
+  }
+
+  WeightsBundle bundle;
+  const size_t ctxSize = ggml_tensor_overhead() * 4096;
+  bundle.ctx = std::unique_ptr<struct ggml_context, decltype(&ggml_free)>(
+      ggml_init({ctxSize, nullptr, /*no_alloc=*/true}), ggml_free);
+  if (!bundle.ctx) {
+    raise("Failed to allocate weights ggml context");
+  }
+
+  auto& tensors = bundle.tensors;
+
+  // Sub-block numbering inside `features.N.block.*`: the depthwise conv
+  // moves to index 1 when an expand conv is present, and the projection
+  // moves one further when an SE block sits in between.
+  struct BlockLayout {
+    bool hasExpand;
+    int dwIdx;
+    int seIdx; // -1 when the block has no SE
+    int projIdx;
+  };
+  auto layoutOf = [](const BlockConfig& cfg) {
+    BlockLayout layout{};
+    layout.hasExpand = cfg.expandedChannels != cfg.inputChannels;
+    layout.dwIdx = layout.hasExpand ? 1 : 0;
+    layout.seIdx = cfg.useSe ? layout.dwIdx + 1 : -1;
+    layout.projIdx = layout.dwIdx + (cfg.useSe ? 2 : 1);
+    return layout;
+  };
+
+  auto registerTensor = [&](struct ggml_tensor* dst) {
+    tensors.emplace(ggml_get_name(dst), dst);
+  };
+
+  auto addConvWeight = [&](const std::string& name) {
+    struct ggml_tensor* t = cloneRaw(bundle.ctx.get(), gguf, ggufCtx, name.c_str());
+    registerTensor(t);
+  };
+
+  // SE bias is registered twice: 1D raw (used by unit tests) and an F32
+  // [1,1,C,1] broadcast view (consumed by the graph against 4D feature maps).
+  auto addSeBiasBroadcast = [&](const std::string& name, int channels) {
+    struct ggml_tensor* raw =
+        cloneRaw(bundle.ctx.get(), gguf, ggufCtx, name.c_str());
+    registerTensor(raw);
+
+    const int64_t shape4d[4] = {1, 1, channels, 1};
+    const std::string brName = name + "_br";
+    struct ggml_tensor* br = cloneAsFp32(bundle.ctx.get(), brName.c_str(), 4, shape4d);
+    tensors.emplace(brName, br);
+  };
+
+  // Fold BN at load time: replaces ~34 per-inference sqrt + 4-op chains.
+  auto addFoldedBn = [&](const std::string& bnPrefix, int channels) {
+    const int64_t shape4d[4] = {1, 1, channels, 1};
+    struct ggml_tensor* scale =
+        cloneAsFp32(bundle.ctx.get(), (bnPrefix + ".scale").c_str(), 4, shape4d);
+    struct ggml_tensor* shift =
+        cloneAsFp32(bundle.ctx.get(), (bnPrefix + ".shift").c_str(), 4, shape4d);
+    tensors.emplace(bnPrefix + ".scale", scale);
+    tensors.emplace(bnPrefix + ".shift", shift);
+  };
+
+  auto addFcWeightFp32 = [&](const std::string& name, int in, int out) {
+    const int64_t shape[2] = {in, out};
+    struct ggml_tensor* t = cloneAsFp32(bundle.ctx.get(), name.c_str(), 2, shape);
+    tensors.emplace(name, t);
+  };
+  auto addFcBiasFp32 = [&](const std::string& name, int out) {
+    const int64_t shape[1] = {out};
+    struct ggml_tensor* t = cloneAsFp32(bundle.ctx.get(), name.c_str(), 1, shape);
+    tensors.emplace(name, t);
+  };
+
+  // ---- Pass 1: declare every tensor (no data yet, ctx is no_alloc). ----
+  addConvWeight("features.0.0.weight");
+  addFoldedBn("features.0.1", kStemOutChannels);
+
+  for (const BlockConfig& cfg : kBlocks) {
+    const std::string base = "features." + std::to_string(cfg.featuresIndex);
+    const BlockLayout layout = layoutOf(cfg);
+    if (layout.hasExpand) {
+      addConvWeight(base + ".block.0.0.weight");
+      addFoldedBn(base + ".block.0.1", cfg.expandedChannels);
+    }
+    const std::string dwBase = base + ".block." + std::to_string(layout.dwIdx);
+    addConvWeight(dwBase + ".0.weight");
+    addFoldedBn(dwBase + ".1", cfg.expandedChannels);
+
+    if (cfg.useSe) {
+      const std::string seBase =
+          base + ".block." + std::to_string(layout.seIdx);
+      addConvWeight(seBase + ".fc1.weight");
+      addSeBiasBroadcast(seBase + ".fc1.bias", cfg.seReducedChannels);
+      addConvWeight(seBase + ".fc2.weight");
+      addSeBiasBroadcast(seBase + ".fc2.bias", cfg.expandedChannels);
+    }
+
+    const std::string projBase =
+        base + ".block." + std::to_string(layout.projIdx);
+    addConvWeight(projBase + ".0.weight");
+    addFoldedBn(projBase + ".1", cfg.outputChannels);
+  }
+
+  addConvWeight("features.12.0.weight");
+  addFoldedBn("features.12.1", kTailOutChannels);
+
+  addFcWeightFp32("classifier.0.weight", kTailOutChannels, kClassifierHidden);
+  addFcBiasFp32("classifier.0.bias", kClassifierHidden);
+  addFcWeightFp32("classifier.3.weight", kClassifierHidden, kNumClasses);
+  addFcBiasFp32("classifier.3.bias", kNumClasses);
+
+  // ---- Pass 2: allocate backend storage for everything declared. ----
+  bundle.backendBuffer =
+      ggml_backend_alloc_ctx_tensors(bundle.ctx.get(), backend);
+  if (bundle.backendBuffer == nullptr) {
+    raise("Failed to allocate backend buffer for weights");
+  }
+
+  // ---- Pass 3: upload data. ----
+  // First pass: raw byte copies for storage-only tensors. Folded/promoted
+  // tensors are filled by foldBn / foldSeBias / uploadClassifierTensor below.
+  for (auto& [name, dst] : tensors) {
+    if (name.ends_with(".scale") || name.ends_with(".shift") ||
+        name.ends_with(".bias_br") || name == "classifier.0.weight" ||
+        name == "classifier.0.bias" || name == "classifier.3.weight" ||
+        name == "classifier.3.bias") {
+      continue;
+    }
+    struct ggml_tensor* src = ggml_get_tensor(ggufCtx, name.c_str());
+    if (src == nullptr) {
+      raise("Source tensor missing from GGUF: " + name);
+    }
+    if (src->type != dst->type) {
+      raise("Dtype mismatch while copying tensor: " + name);
+    }
+    ggml_backend_tensor_set(dst, src->data, 0, ggml_nbytes(src));
+  }
+
+  // Uploads an F32 host buffer, refusing any element-count mismatch so a
+  // wrongly shaped GGUF tensor cannot over- or under-fill the destination.
+  auto uploadF32 = [&](struct ggml_tensor* dst, const std::vector<float>& buf) {
+    if (static_cast<size_t>(ggml_nelements(dst)) != buf.size()) {
+      raise(
+          std::string("Element count mismatch for ") + ggml_get_name(dst) +
+          ": expected " + std::to_string(ggml_nelements(dst)) + ", got " +
+          std::to_string(buf.size()));
+    }
+    ggml_backend_tensor_set(dst, buf.data(), 0, buf.size() * sizeof(float));
+  };
+
+  // scale = weight / sqrt(var + eps); shift = bias - mean * scale.
+  auto foldBn = [&](const std::string& bnPrefix) {
+    std::vector<float> w =
+        loadVector1d(gguf, ggufCtx, bnPrefix + ".weight");
+    std::vector<float> b =
+        loadVector1d(gguf, ggufCtx, bnPrefix + ".bias");
+    std::vector<float> m =
+        loadVector1d(gguf, ggufCtx, bnPrefix + ".running_mean");
+    std::vector<float> v =
+        loadVector1d(gguf, ggufCtx, bnPrefix + ".running_var");
+    const size_t n = w.size();
+    if (b.size() != n || m.size() != n || v.size() != n) {
+      raise("BN param size mismatch for " + bnPrefix);
+    }
+    std::vector<float> scale(n);
+    std::vector<float> shift(n);
+    for (size_t i = 0; i < n; ++i) {
+      const float invStd = 1.0F / std::sqrt(v[i] + bnEps);
+      scale[i] = w[i] * invStd;
+      shift[i] = b[i] - m[i] * scale[i];
+    }
+    uploadF32(tensors.at(bnPrefix + ".scale"), scale);
+    uploadF32(tensors.at(bnPrefix + ".shift"), shift);
+  };
+
+  auto foldSeBias = [&](const std::string& biasName) {
+    std::vector<float> b = loadVector1d(gguf, ggufCtx, biasName);
+    uploadF32(tensors.at(biasName + "_br"), b);
+  };
+
+  foldBn("features.0.1");
+  for (const BlockConfig& cfg : kBlocks) {
+    const std::string base = "features." + std::to_string(cfg.featuresIndex);
+    const BlockLayout layout = layoutOf(cfg);
+    if (layout.hasExpand) {
+      foldBn(base + ".block.0.1");
+    }
+    foldBn(base + ".block." + std::to_string(layout.dwIdx) + ".1");
+    if (cfg.useSe) {
+      const std::string seBase =
+          base + ".block." + std::to_string(layout.seIdx);
+      foldSeBias(seBase + ".fc1.bias");
+      foldSeBias(seBase + ".fc2.bias");
+    }
+    foldBn(base + ".block." + std::to_string(layout.projIdx) + ".1");
+  }
+  foldBn("features.12.1");
+
+  auto uploadClassifierTensor = [&](const std::string& name) {
+    std::vector<float> buf = loadVector1d(gguf, ggufCtx, name);
+    uploadF32(tensors.at(name), buf);
+  };
+  uploadClassifierTensor("classifier.0.weight");
+  uploadClassifierTensor("classifier.0.bias");
+  uploadClassifierTensor("classifier.3.weight");
+  uploadClassifierTensor("classifier.3.bias");
+
+  return bundle;
+}
+
+/// Builds the MobileNetV3-Small forward graph over already-loaded weights
+/// and allocates its tensors on `backend`.
+///
+/// Layout: stem conv -> the inverted-residual blocks in `kBlocks` -> tail
+/// 1x1 conv -> average pool over the remaining spatial extent -> two
+/// fully-connected layers. `input` is a 224x224x3x1 F32 tensor and `output`
+/// holds `kNumClasses` logits.
+///
+/// @throws StatusError(InternalError) when a weight is missing, the output
+///         does not have `kNumClasses` elements, or allocation fails.
+ComputeGraph buildGraph(const WeightsBundle& weights, ggml_backend_t backend) {
+  // Node capacity of the custom graph created below. The context budget
+  // must be sized for this capacity: plain ggml_graph_overhead() only
+  // covers a default-sized graph, so the previous budget relied on slack in
+  // the tensor allowance to fit the larger graph object.
+  constexpr size_t kMaxGraphNodes = 8192;
+
+  ComputeGraph cg;
+  const size_t ctxSize =
+      ggml_tensor_overhead() * 4096 +
+      ggml_graph_overhead_custom(kMaxGraphNodes, /*grads=*/false);
+  cg.ctx = std::unique_ptr<struct ggml_context, decltype(&ggml_free)>(
+      ggml_init({ctxSize, nullptr, /*no_alloc=*/true}), ggml_free);
+  if (!cg.ctx) {
+    raise("Failed to allocate graph ggml context");
+  }
+  struct ggml_context* ctx = cg.ctx.get();
+
+  // WHCN: width, height, channels, batch.
+  cg.input =
+      ggml_new_tensor_4d(ctx, GGML_TYPE_F32, kInputHw, kInputHw, 3, 1);
+  ggml_set_name(cg.input, "input");
+
+  GraphBuilder gb{ctx, weights.tensors};
+
+  struct ggml_tensor* x = gb.convBnAct(
+      cg.input, "features.0.0", "features.0.1", /*stride=*/2, /*kernel=*/3,
+      /*activate=*/true, /*useHardswish=*/true);
+
+  // The stride-2 stem halves the spatial size.
+  int spatial = kInputHw / 2;
+
+  for (const BlockConfig& cfg : kBlocks) {
+    x = gb.invertedResidual(x, cfg, spatial);
+    // Track the spatial size so SE and the final pooling use the right
+    // window; stride-2 blocks halve it (rounding up).
+    if (cfg.stride == 2) {
+      spatial = (spatial + 1) / 2;
+    }
+  }
+
+  x = gb.convBnAct(
+      x, "features.12.0", "features.12.1", /*stride=*/1, /*kernel=*/1,
+      /*activate=*/true, /*useHardswish=*/true);
+
+  // Pool with window == remaining spatial size, then flatten to a vector.
+  struct ggml_tensor* pooled = ggml_pool_2d(
+      ctx, x, GGML_OP_POOL_AVG, spatial, spatial, spatial, spatial, 0, 0);
+  struct ggml_tensor* flat = ggml_reshape_1d(ctx, pooled, kTailOutChannels);
+
+  struct ggml_tensor* fc0 = ggml_mul_mat(
+      ctx, gb.t("classifier.0.weight"), flat);
+  fc0 = ggml_add(ctx, fc0, gb.t("classifier.0.bias"));
+  fc0 = ggml_hardswish(ctx, fc0);
+
+  struct ggml_tensor* fc3 = ggml_mul_mat(
+      ctx, gb.t("classifier.3.weight"), fc0);
+  fc3 = ggml_add(ctx, fc3, gb.t("classifier.3.bias"));
+
+  cg.output = fc3;
+  ggml_set_name(cg.output, "logits");
+
+  // The warmup and process() paths both read sizeof(float)*kNumClasses
+  // bytes from cg.output; mismatch silently truncates or reads OOB.
+  if (ggml_nelements(cg.output) != static_cast<int64_t>(kNumClasses)) {
+    raise(
+        "Compute graph output has " +
+        std::to_string(ggml_nelements(cg.output)) +
+        " elements, expected " + std::to_string(kNumClasses) +
+        "; classifier wiring or GGUF weight shapes are inconsistent with "
+        "graph::kNumClasses");
+  }
+
+  cg.graph = ggml_new_graph_custom(ctx, kMaxGraphNodes, /*grads=*/false);
+  ggml_build_forward_expand(cg.graph, cg.output);
+
+  cg.backendBuffer = ggml_backend_alloc_ctx_tensors(ctx, backend);
+  if (cg.backendBuffer == nullptr) {
+    raise("Failed to allocate backend buffer for compute graph");
+  }
+
+  return cg;
+}
+
+} // namespace classification_ggml::graph
diff --git a/packages/classification-ggml/addon/src/model-interface/MobileNetGraph.hpp b/packages/classification-ggml/addon/src/model-interface/MobileNetGraph.hpp
new file mode 100644
index 0000000000..3982354fec
--- /dev/null
+++ b/packages/classification-ggml/addon/src/model-interface/MobileNetGraph.hpp
@@ -0,0 +1,99 @@
+#pragma once
+
+#include <array>
+#include <cstdint>
+#include <memory>
+#include <string>
+#include <unordered_map>
+#include <vector>
+
+#include <ggml-backend.h>
+#include <ggml.h>
+
+namespace classification_ggml::graph {
+
+/// One torchvision MobileNetV3-Small `InvertedResidual` block.
+struct BlockConfig {
+  int featuresIndex;   // 1..11, matches `features.N` in the GGUF
+  int inputChannels;   // channels entering the block
+  int expandedChannels; // expanded (hidden) channel count inside the block
+  int outputChannels;  // channels leaving the block
+  int depthwiseKernel; // 3 or 5
+  int stride;          // 1 or 2
+  bool useHardswish;   // false = ReLU
+  bool useSe;          // true = block has a squeeze-excite (SE) stage
+  int seReducedChannels; // SE reduced width; 0 in the kBlocks rows without SE
+};
+
+inline constexpr int kNumBlocks = 11; // one row per `features.1` .. `features.11`
+inline constexpr std::array<BlockConfig, kNumBlocks> kBlocks = {{
+    // idx  inC  expC  outC  k  s  hs     se     seR   (BlockConfig field order)
+    {1, 16, 16, 16, 3, 2, false, true, 8},
+    {2, 16, 72, 24, 3, 2, false, false, 0},
+    {3, 24, 88, 24, 3, 1, false, false, 0},
+    {4, 24, 96, 40, 5, 2, true, true, 24},
+    {5, 40, 240, 40, 5, 1, true, true, 64},
+    {6, 40, 240, 40, 5, 1, true, true, 64},
+    {7, 40, 120, 48, 5, 1, true, true, 32},
+    {8, 48, 144, 48, 5, 1, true, true, 40},
+    {9, 48, 288, 96, 5, 2, true, true, 72},
+    {10, 96, 576, 96, 5, 1, true, true, 144},
+    {11, 96, 576, 96, 5, 1, true, true, 144},
+}};
+
+inline constexpr int kStemOutChannels = 16;   // output channels of the `features.0` stem conv
+inline constexpr int kTailOutChannels = 576;  // length of the pooled vector fed to `classifier.0`
+inline constexpr int kClassifierHidden = 1024; // width between `classifier.0` and `classifier.3`
+inline constexpr int kNumClasses = 3;         // element count buildGraph requires of the logits
+inline constexpr float kBatchNormEpsilon = 0.001F; // presumably the BN-fold epsilon — confirm in loadWeights
+inline constexpr int kInputHw = 224;          // input image height and width, in pixels
+
+/// ggml context + name→tensor map for every weight, plus the backing
+/// backend buffer. Lives for the entire model lifetime.
+struct WeightsBundle {
+  std::unique_ptr<struct ggml_context, decltype(&ggml_free)> ctx{
+      nullptr, ggml_free}; // owning; released through ggml_free
+  std::unordered_map<std::string, struct ggml_tensor*> tensors; // keyed by tensor name
+  ggml_backend_buffer_t backendBuffer = nullptr; // raw handle, no RAII wrapper at this level
+
+  WeightsBundle() = default;
+  WeightsBundle(const WeightsBundle&) = delete; // move-only type
+  WeightsBundle& operator=(const WeightsBundle&) = delete;
+  WeightsBundle(WeightsBundle&& other) noexcept;
+  WeightsBundle& operator=(WeightsBundle&& other) noexcept;
+  ~WeightsBundle();
+
+  void reset(); // defined out of line; presumably frees ctx + backendBuffer — confirm in the .cpp
+};
+
+/// Compute graph + its ggml context. Input/output tensors are reused
+/// across classify() calls; only input pixel data is rewritten per call.
+struct ComputeGraph {
+  std::unique_ptr<struct ggml_context, decltype(&ggml_free)> ctx{
+      nullptr, ggml_free}; // owning; released through ggml_free
+  struct ggml_cgraph* graph = nullptr; // forward graph expanded from `output`
+  struct ggml_tensor* input = nullptr; // pixel tensor the caller fills before each compute
+  struct ggml_tensor* output = nullptr; // final classifier tensor, named "logits"
+  ggml_backend_buffer_t backendBuffer = nullptr; // raw handle, no RAII wrapper at this level
+
+  ComputeGraph() = default;
+  ComputeGraph(const ComputeGraph&) = delete; // move-only type
+  ComputeGraph& operator=(const ComputeGraph&) = delete;
+  ComputeGraph(ComputeGraph&& other) noexcept;
+  ComputeGraph& operator=(ComputeGraph&& other) noexcept;
+  ~ComputeGraph();
+
+  void reset(); // defined out of line; presumably frees ctx + backendBuffer — confirm in the .cpp
+};
+
+/// Loads every tensor + the `mobilenet.class_N` labels from the GGUF file at
+/// `ggufPath`. Output param `outLabels` is left empty if those metadata keys are absent.
+WeightsBundle loadWeights(
+    const std::string& ggufPath, ggml_backend_t backend,
+    std::vector<std::string>& outLabels);
+
+/// Build the MobileNetV3-Small forward graph from `weights`. Caller writes pixels
+/// into the returned `input` tensor via `ggml_backend_tensor_set` before each compute.
+ComputeGraph buildGraph(const WeightsBundle& weights, ggml_backend_t backend);
+
+} // namespace classification_ggml::graph
diff --git a/packages/classification-ggml/binding.js b/packages/classification-ggml/binding.js
new file mode 100644
index 0000000000..cea46308c0
--- /dev/null
+++ b/packages/classification-ggml/binding.js
@@ -0,0 +1 @@
+module.exports = require.addon() // re-export this package's native addon (Bare `require.addon`)
diff --git a/packages/classification-ggml/docs/architecture.md b/packages/classification-ggml/docs/architecture.md
new file mode 100644
index 0000000000..0c60092ea5
--- /dev/null
+++ b/packages/classification-ggml/docs/architecture.md
@@ -0,0 +1,190 @@
+# Architecture — `@qvac/classification-ggml`
+
+This document describes the architecture of the MobileNetV3-Small 3-class
+image classification addon, the GGML compute graph it constructs, and the
+rationale for the key implementation choices.
+
+## Component layout
+
+```
++----------------------------------------------+
+|  JS: ImageClassifier (index.js)              |
+|   - lifecycle (load / classify / unload)     |
+|     all serialised via exclusiveRunQueue     |
+|   - createJobHandler + QvacResponse plumbing |
+|   - thin pass-through to native validation   |
++----------------------------------------------+
+|  JS: ClassificationInterface (addon.js)      |
+|   - thin native bridge: createInstance,      |
+|     activate, runJob, cancel, unload         |
+|   - exports mapAddonEvent for index.js       |
+|     (shape-keyed Output / JobEnded routing)  |
++----------------------------------------------+
+|  Native: BARE_MODULE (binding.cpp)           |
+|   - exports createInstance/runJob/activate… |
++----------------------------------------------+
+|  Native: AddonJs (addon/AddonJs.hpp)         |
+|   - js <-> C++ bridge                        |
+|   - single source of truth for argument      |
+|     validation (type / range / shape)        |
+|   - packs ClassifyInput (vector<uint8_t> +   |
+|     optional<RawRgbDims> + topK)             |
+|   - JsClassifyOutputHandler → JS array       |
++----------------------------------------------+
+|  Native: AddonCpp  (from @qvac/…-addon-cpp)  |
+|   - JobRunner (dedicated worker thread)      |
+|   - OutputQueue + OutputCallback plumbing    |
++----------------------------------------------+
+|  Native: ClassificationModel (IModel)        |
+|   - load(): backend init + weights + graph   |
+|     + full-pipeline warmup pass              |
+|     desktop/iOS: ggml_backend_cpu_init()     |
+|     android   : load_all_from_path(<dir>) +  |
+|                 dev_by_type(CPU) + dev_init  |
+|   - process(): preprocess → compute → softmax|
++----------------------------------------------+
+|  Native: MobileNetGraph                      |
+|   - loadWeights(): GGUF → folded BN + FC F32 |
+|     (validates mobilenet.num_classes)        |
+|   - buildGraph(): static forward compute     |
+|     graph wired to pre-allocated buffers     |
+|     (asserts ggml_nelements(output) ==       |
+|     kNumClasses before allocation)           |
++----------------------------------------------+
+|  libggml (CPU backend only, via qvac-fabric) |
+|   - desktop/iOS: CPU statically linked into  |
+|     the .bare                                |
+|   - android: per-microarch CPU MODULE .so    |
+|     ships next to the .bare under            |
+|     prebuilds/android-arm64/qvac__…/         |
++----------------------------------------------+
+```
+
+## MobileNetV3-Small layer list
+
+The graph matches `torchvision.models.mobilenet_v3_small` with the bundled
+3-class classifier head. Spatial dimensions start at `224×224` and halve
+at each stride-2 layer.
+
+| Stage          | Op                                    | In    | Out   | Spatial |
+|----------------|---------------------------------------|-------|-------|---------|
+| `features.0`   | Conv2dBN + HardSwish (3×3, s=2)       | 3     | 16    | 112     |
+| `features.1`   | InvertedResidual (DW 3×3 s=2, SE, ReLU) | 16 | 16    | 56      |
+| `features.2`   | InvertedResidual (exp→72, DW 3×3 s=2, ReLU) | 16 | 24 | 28      |
+| `features.3`   | InvertedResidual (exp→88, DW 3×3 s=1, ReLU, +) | 24 | 24 | 28    |
+| `features.4`   | InvertedResidual (exp→96, DW 5×5 s=2, SE, HS)  | 24 | 40 | 14     |
+| `features.5`   | InvertedResidual (exp→240, DW 5×5 s=1, SE, HS, +) | 40 | 40 | 14  |
+| `features.6`   | InvertedResidual (exp→240, DW 5×5 s=1, SE, HS, +) | 40 | 40 | 14  |
+| `features.7`   | InvertedResidual (exp→120, DW 5×5 s=1, SE, HS)    | 40 | 48 | 14  |
+| `features.8`   | InvertedResidual (exp→144, DW 5×5 s=1, SE, HS, +) | 48 | 48 | 14  |
+| `features.9`   | InvertedResidual (exp→288, DW 5×5 s=2, SE, HS)    | 48 | 96 | 7   |
+| `features.10`  | InvertedResidual (exp→576, DW 5×5 s=1, SE, HS, +) | 96 | 96 | 7   |
+| `features.11`  | InvertedResidual (exp→576, DW 5×5 s=1, SE, HS, +) | 96 | 96 | 7   |
+| `features.12`  | Conv2dBN + HardSwish (1×1)            | 96    | 576   | 7       |
+| avg-pool       | GlobalAveragePool                     | 576   | 576   | 1       |
+| `classifier.0` | Linear + HardSwish                    | 576   | 1024  | 1       |
+| `classifier.3` | Linear                                | 1024  | 3     | 1       |
+
+Totals: **34 conv layers** (1 stem + 11 × {1 or 2 1×1 + 1 DW} + 1 tail)
+and **2 linear layers** in the classifier. `+` marks the residual add
+(applied when `stride == 1` and `inputChannels == outputChannels`).
+
+## GGML graph construction
+
+### Weight loading
+
+`MobileNetGraph::loadWeights()` opens the GGUF file via
+`gguf_init_from_file()` and clones every required tensor into a freshly
+allocated `ggml_context` that is backed by a CPU backend buffer (allocated
+with `ggml_backend_alloc_ctx_tensors`).
+
+Weights are transformed at load time into two layouts:
+
+1. **Raw FP16** (`cloneRaw`) for conv kernels and SE FC kernels — the
+   native `ggml_conv_2d` / `ggml_conv_2d_dw` paths accept F16 kernels
+   against an F32 input on the CPU backend.
+2. **Folded FP32 BN scale/shift** (`cloneAsFp32` + second pass) for every
+   BatchNorm layer. At load time we compute:
+
+   ```
+   scale_c = weight_c / sqrt(running_var_c + 0.001)
+   shift_c = bias_c - running_mean_c * scale_c
+   ```
+
+   and store `scale[1,1,C,1]` and `shift[1,1,C,1]` tensors. The forward
+   graph then applies BN as a single `ggml_mul` + `ggml_add` broadcast.
+
+This fold replaces 34 × 4 ops (`sub`, `div`, `mul`, `add`) per inference
+with 34 × 2 (`mul`, `add`) and sidesteps the classic `eps = 1e-5` mistake by
+computing the division exactly once against the GGUF-supplied `0.001`.
+
+Classifier FC weights and biases are promoted to FP32 on load for
+numerical stability of the tiny 3-element logits tail.
+
+### Forward graph
+
+`MobileNetGraph::buildGraph()` builds a static graph in a second
+`ggml_context` with `no_alloc = true`. The graph is allocated on the
+backend once, wiring up:
+
+- `input` tensor `[W=224, H=224, C=3, N=1] F32`
+- Stem conv + BN + HardSwish
+- 11 `InvertedResidual` blocks (`GraphBuilder::invertedResidual`)
+- Tail conv + BN + HardSwish
+- Global average pool (`ggml_pool_2d` with kernel == spatial extent)
+- Reshape to 1-D (576)
+- `classifier.0.weight` linear + bias + HardSwish
+- `classifier.3.weight` linear + bias → logits
+
+The graph is captured via `ggml_new_graph_custom` + `ggml_build_forward_expand`.
+
+### Per-inference path
+
+`ClassificationModel::process()`:
+
+1. Preprocess the image buffer to a 224×224×3 FP32 WHCN tensor.
+2. `ggml_backend_tensor_set(input, fp32Buffer)` — copies pixels only.
+3. `ggml_backend_graph_compute(backend, graph)`.
+4. `ggml_backend_tensor_get(output, logits)`.
+5. Numerically stable softmax over 3 logits in C++.
+6. Build sorted `ClassifyResult` list, apply `topK`, return.
+
+Nothing allocates tensors in the hot path; the only per-call work is the
+pixel copy, the compute itself, the 3-element softmax, and label lookup.
+
+## Threading model
+
+- Each `ClassificationModel` instance owns its own `JobRunner` worker
+  thread (inherited from `qvac-lib-inference-addon-cpp`), so concurrent
+  `classify()` calls are serialized per instance but independent across
+  instances — supporting acceptance criterion N6.
+- The JS-side `exclusiveRunQueue()` (mirroring `LlmLlamacpp`) further
+  serialises `load`, `classify`, and `unload` per `ImageClassifier`
+  instance, so an `unload()` racing an in-flight `classify()` queues
+  cleanly behind it (and explicitly cancels then fails the in-flight
+  request with `Model was unloaded`).
+- Per-inference mutex (`ClassificationModel::mutex_`) guards against a
+  torn state if a future user bypasses `JobRunner`.
+- The CPU compute thread count is left at libggml's default
+  (`std::thread::hardware_concurrency`) on every platform; the addon
+  does not expose a `threads` knob. Rationale: on Apple/Linux/Windows
+  desktop the symbol `ggml_backend_cpu_set_n_threads` is statically
+  linkable, but on Android the CPU backend is loaded as a per-microarch
+  MODULE `.so` (`GGML_CPU_ALL_VARIANTS=ON`) where the setter is not
+  resolvable from the addon's `.bare`, so a `threads` config value
+  could only ever apply on a subset of platforms. We picked
+  consistency and dropped the knob altogether.
+
+## Memory footprint
+
+- Weights on the CPU backend: ≈ `2.94 MB` + ≈ `60 KB` of folded BN scale/
+  shift + FP32 classifier FC (≈ `2.5 MB`) ≈ **5.5 MB total** in memory.
+- Compute buffer (intermediate activations): single-digit MB for a
+  224×224 input — allocated once at `load()` time.
+- No heap allocation inside the hot path.
+
+## References
+
+- Howard et al., *Searching for MobileNetV3*, arXiv:1905.02244, 2019.
+- `torchvision.models.mobilenet_v3_small` — reference architecture.
+- GGML public API: `ggml.h`, `ggml-backend.h`, `ggml-alloc.h`, `gguf.h`.
diff --git a/packages/classification-ggml/docs/data-flow.md b/packages/classification-ggml/docs/data-flow.md
new file mode 100644
index 0000000000..310561f9c0
--- /dev/null
+++ b/packages/classification-ggml/docs/data-flow.md
@@ -0,0 +1,191 @@
+# Data flow — `@qvac/classification-ggml`
+
+End-to-end trace of a single `classifier.classify(buffer)` call.
+
+```
++-------------------------+
+|  Caller                 |
+|  classifier.classify(   |
+|    imageBuffer, opts)   |
++-----------+-------------+
+            |  JPEG/PNG/raw RGB bytes + {topK?, width?, height?, channels?}
+            v
++-------------------------+
+|  ImageClassifier (JS)   |
+|  - lifecycle gates      |
+|    (load / classify /   |
+|    unload all serialised|
+|   via exclusiveRunQueue)|
+|  - thin pass-through:   |
+|    builds native job    |
+|    { type: 'image',     |
+|      content: buf,      |
+|      width?, height?,   |
+|      channels?, topK? } |
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  ClassificationInterface|
+|  (addon.js)             |
+|  - createInstance once  |
+|  - binding.runJob(...)  |
+|  - native events fan    |
+|    out via mapAddonEvent|
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  Native binding.cpp     |
+|  - resolves addon handle|
+|  - calls js::runJob     |
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  AddonJs::runJob (C++)  |
+|  Single source of truth |
+|  for argument validation|
+|  - type === 'image'     |
+|  - content is TypedArray|
+|  - width/height/channels|
+|    all-or-nothing trio  |
+|  - topK > 0 if provided |
+|  - bare-runtime int32   |
+|    range checks         |
+|  Throws StatusError     |
+|  (InvalidArgument) on   |
+|  any violation.         |
+|  - packs ClassifyInput  |
+|    (vector<uint8_t> +   |
+|    optional<RawRgbDims> |
+|    + topK)              |
+|  - AddonCpp.runJob(any) |
++-----------+-------------+
+            |
+            |  ClassifyInput
+            v
++-------------------------+
+|  JobRunner worker thread|
+|  - pops job             |
+|  - model->process(any)  |
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  ClassificationModel::  |
+|  process()              |
+|                         |
+|  1) preprocessToTensor  |
+|     (stb_image decode + |
+|      bilinear resize +  |
+|      ImageNet normalize)|
+|                         |
+|  2) ggml_backend_tensor_|
+|     set(input, fp32buf) |
+|                         |
+|  3) ggml_backend_graph_ |
+|     compute(backend, g) |
+|                         |
+|  4) ggml_backend_tensor_|
+|     get(output, logits) |
+|                         |
+|  5) softmax (C++)       |
+|                         |
+|  6) build sorted result |
++-----------+-------------+
+            |
+            |  ClassifyOutput (std::any)
+            v
++-------------------------+
+|  OutputQueue → Output   |
+|  CallbackJs → JS        |
+|  _outputCallback(event, |
+|   data, error)          |
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  JsClassifyOutputHandler|
+|  ClassifyOutput → JS    |
+|  Array<{label, confid.}>|
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  ImageClassifier (JS)   |
+|  _job.end() on terminal |
+|  → response.await()     |
+|    resolves with        |
+|    collected[0]         |
++-----------+-------------+
+            |
+            v
++-------------------------+
+|  Caller awaits result   |
+|  [{label, confidence}]  |
++-------------------------+
+```
+
+## Error paths
+
+| Failure                                     | Where                                         | Surface behaviour |
+|---------------------------------------------|-----------------------------------------------|-------------------|
+| `null` / non-Buffer / non-Uint8Array input  | `AddonJs::runJob` (C++)                       | `StatusError(InvalidArgument)` — "Image 'content' is required and must be a Uint8Array / Buffer …" |
+| Empty buffer                                | `AddonJs::runJob` (C++)                       | `StatusError(InvalidArgument)` — "Image 'content' buffer is empty" |
+| Unsupported format (BMP, text, …)           | `ImagePreprocessor::isEncodedImage` (C++)     | `StatusError(InvalidArgument)` — "Unsupported image format: expected JPEG or PNG …" |
+| Corrupted JPEG / PNG                        | `ImagePreprocessor::decodeToRgb` (C++)        | `StatusError(InvalidArgument)` surfaced as JS `Error` |
+| Raw bytes + missing one of width/height/channels | `AddonJs::runJob` (C++)                  | `StatusError(InvalidArgument)` — "Raw RGB input requires all of 'width', 'height', and 'channels' …" |
+| Raw bytes + non-positive width / height     | `AddonJs::runJob` (C++)                       | `StatusError(InvalidArgument)` — "must be a positive integer when passing raw RGB bytes" |
+| Raw bytes + channels ≠ 3                    | `AddonJs::runJob` (C++)                       | `StatusError(InvalidArgument)` — "must be exactly 3 (RGB) when passing raw RGB bytes" |
+| Buffer size mismatch (raw input)            | `ImagePreprocessor::validateRawRgb` (C++)     | `StatusError(InvalidArgument)` |
+| `topK ≤ 0` when provided                    | `AddonJs::runJob` (C++)                       | `StatusError(InvalidArgument)` — "must be a positive integer when provided" |
+| Missing `config.backendsDir` on Android     | `ClassificationModel::load` (C++, Android)    | `StatusError(InvalidArgument)` — "Configuration 'config.backendsDir' is required on Android"; `index.js` defaults it to `path.join(__dirname, 'prebuilds')` so this only fires when the addon is wired up by hand |
+| GGML CPU backend variant init failure       | `ClassificationModel::load` (C++, Android)    | `StatusError(InternalError)` — "Failed to find/init CPU backend device"; raised when `ggml_backend_load_all_from_path` couldn't enumerate any per-microarch variant under `<backendsDir>/<BACKENDS_SUBDIR>/` |
+| `classify` before `load`                    | `ImageClassifier._classifyInternal` (JS)      | `Error("Classifier not loaded. Call load() first.")` |
+| `classify` after `unload`                   | `ImageClassifier._classifyInternal` (JS)      | same |
+| `unload` mid-classify                       | `ImageClassifier.unload` (JS)                 | the in-flight `classify()` promise rejects with `Error("Model was unloaded")` |
+| GGUF weights file missing                   | `ImageClassifier._load` (JS)                  | `Error("MobileNet GGUF weights not found at: …")` |
+| GGUF `mobilenet.num_classes` mismatch       | `MobileNetGraph::loadWeights` (C++)           | `StatusError(InvalidArgument)` — "does not match the addon's compiled-in class count" |
+| Compute graph output shape mismatch         | `MobileNetGraph::buildGraph` (C++)            | `StatusError(InternalError)` — defence-in-depth, never seen in practice |
+| `ggml_backend_graph_compute` non-success    | `ClassificationModel::process` (C++)          | `StatusError(InternalError)` |
+
+All errors are wrapped by the existing `qvac-lib-inference-addon-cpp`
+error infrastructure and reach the caller as structured JS Errors. Native
+code never aborts on bad input — this is validated by the error-case
+integration tests in `test/integration/error-cases.test.js` and by the
+preprocessor / model unit tests in `test/unit/*.cpp`.
+
+## Lifecycle
+
+```
+new ImageClassifier()
+        │
+        │ .load()
+        ▼
+┌──────────────────────────────────────────────┐
+│ ClassificationModel::load                    │
+│   backend init:                              │
+│     desktop  : ggml_backend_cpu_init()       │
+│     android  : ggml_backend_load_all_from_   │
+│                  path(<backendsDir>/<sub>) → │
+│                ggml_backend_dev_by_type(CPU) │
+│                  → ggml_backend_dev_init     │
+│   weights = loadWeights(gguf, backend)       │
+│   graph   = buildGraph(weights, backend)     │
+│   loaded  = true                             │
+└────────┬─────────────────────────────────────┘
+         │  many .classify(…) calls — pixel data only per-call
+         │
+         │ .unload()
+         ▼
+┌───────────────────────┐
+│ destroyInstance()     │
+│   ~AddonJs → ~AddonCpp│
+│   ~ClassificationModel│
+│   ggml_backend_free   │
+└───────────────────────┘
+```
+
+Repeated load/unload cycles do not leak native handles — validated by
+`error-cases.test.js: load -> unload -> load cycles do not leak handles`.
diff --git a/packages/classification-ggml/docs/onnx-to-gguf-conversion.md b/packages/classification-ggml/docs/onnx-to-gguf-conversion.md
new file mode 100644
index 0000000000..d4ae4c6a8d
--- /dev/null
+++ b/packages/classification-ggml/docs/onnx-to-gguf-conversion.md
@@ -0,0 +1,167 @@
+# ONNX to GGUF Conversion (Public-safe)
+
+This document describes a public-safe conversion workflow for preparing
+MobileNetV3-Small weights for this addon.
+
+## 1) Export PyTorch to ONNX
+
+- Freeze model in eval mode.
+- Keep BatchNorm unfolded: the addon folds BN at load time from the raw parameters.
+- Export with fixed input shape `1x3x224x224`.
+
+## 2) Convert ONNX tensors into GGUF
+
+- Write tensor weights into a GGUF container.
+- Store model labels in metadata (`mobilenet.class_*` keys).
+- Use FP16 for shipped runtime weights.
+
+## 3) Verify numerics internally
+
+- Compare ONNX and GGUF runtime logits on a private validation corpus.
+- Ensure argmax agreement and tight per-logit tolerance.
+
+## 4) Integrate with addon
+
+- Replace `weights/mobilenetv3_3class_v3_fp16.gguf`.
+- Keep API output unchanged (`[{ label, confidence }]`).
+
+## Known pitfalls
+
+- BatchNorm epsilon must match training/export settings.
+- Depthwise conv paths require exact tensor shape/layout wiring.
+- Aggressive quantization can degrade CNN quality.
+# Converting a MobileNetV3-Small model to the GGUF format used by this addon
+
+This guide describes how to convert a retrained (or freshly exported)
+MobileNetV3-Small PyTorch model into the GGUF container consumed by
+`@qvac/classification-ggml`. It is intentionally minimal — the graph
+construction in `MobileNetGraph.cpp` is parameterised only by the block
+table `kBlocks` and the label metadata inside the GGUF, so swapping in new
+class labels (or a different fine-tune) needs no C++ changes as long as the
+architecture stays MobileNetV3-Small and the class count stays at `kNumClasses` (3).
+
+> The bundled weights in `weights/mobilenetv3_3class_v3_fp16.gguf` were
+> produced by this exact pipeline. FP16 yields the same predictions as the
+> ONNX FP32 reference on representative inputs.
+
+## 1. Export from PyTorch to ONNX
+
+```python
+import torch
+from torchvision.models import mobilenet_v3_small
+
+model = mobilenet_v3_small(weights=None)
+# Replace the 1000-class head with an N-class head that matches your target classes.
+model.classifier[3] = torch.nn.Linear(1024, NUM_CLASSES)
+model.load_state_dict(torch.load("your_finetuned_weights.pth"))
+model.eval()
+
+dummy = torch.randn(1, 3, 224, 224)
+torch.onnx.export(
+    model,
+    dummy,
+    "mobilenetv3_small.onnx",
+    input_names=["input"],
+    output_names=["logits"],
+    opset_version=17,
+)
+```
+
+Notes:
+
+- Export the model in **inference mode**. `model.eval()` is mandatory:
+  it puts BatchNorm into running-statistics mode.
+- Do **not** fold BatchNorm into conv at ONNX export time. This addon
+  folds BN at load time inside the C++ code using the GGUF-supplied
+  `running_mean`, `running_var`, `weight`, `bias` — it needs the raw
+  BN parameters to exist in the file.
+
+## 2. Convert ONNX weights to GGUF
+
+The conversion script used for the bundled model produces a GGUF with
+the torchvision tensor naming preserved verbatim (`features.0.0.weight`,
+`features.1.block.0.0.weight`, …, `classifier.3.bias`). Any converter
+that emits the same tensor names and the required metadata keys works.
+
+Required GGUF **tensor layout**:
+
+- Conv kernels: `[KW, KH, IC, OC]` (ggml convention, matches
+  `torch.Tensor` export when dims are reversed).
+- Depthwise conv kernels: `[KW, KH, 1, C]`.
+- SE `fc1` / `fc2`: `[1, 1, IC, OC]` (1×1 convs, not Linear).
+- Classifier `classifier.0.weight`: `[576, 1024]`.
+- Classifier `classifier.3.weight`: `[1024, NUM_CLASSES]`.
+- BN tensors (`weight`, `bias`, `running_mean`, `running_var`): `[C]`
+  1-D. `num_batches_tracked` is accepted but ignored.
+
+Required GGUF **metadata keys**:
+
+| Key | Type | Example |
+|-----|------|---------|
+| `general.architecture` | string | `"mobilenetv3-small"` |
+| `general.description` | string | `"MobileNetV3-Small 3-class FP16"` |
+| `mobilenet.architecture` | string | `"mobilenetv3_small"` |
+| `mobilenet.num_classes` | uint32 | `3` |
+| `mobilenet.image_size` | uint32 | `224` |
+| `mobilenet.class_0` | string | `"food"` |
+| `mobilenet.class_1` | string | `"report"` |
+| `mobilenet.class_2` | string | `"other"` |
+| `mobilenet.mean_r/g/b` | float32 | `0.485 / 0.456 / 0.406` |
+| `mobilenet.std_r/g/b` | float32 | `0.229 / 0.224 / 0.225` |
+| `mobilenet.bn_eps` | float32 | **`0.001`** (required — see below) |
+| `mobilenet.precision` | string | `"fp16"` or `"fp32"` |
+
+Quantization choice:
+
+- **FP16** is the target for shipping; FP16 produces numerically
+  identical predictions to the FP32 reference on representative inputs.
+- **FP32** is supported for debugging. Twice the file size, same output.
+- **INT8 / Q4_0 are destructive** for MobileNetV3-Small because
+  depthwise convolutions have only 9–25 weights per channel. Sub-8-bit
+  quantization introduces unacceptable error on these layers. Do not
+  ship quantized variants.
+
+## 3. Verify numerical equivalence
+
+Run the C++ addon against your internal set of reference images and
+compare logits to the ONNX reference:
+
+```
+| logit_difference | < 1e-4 per class, FP32
+| argmax agreement | must match the ONNX reference on every image
+```
+
+`test/integration/classify.test.js` and
+`test/unit/classification_model_test.cpp` cover the shape contract and
+the per-image argmax on the 6 public sample images shipped in
+`test/images/`. The per-image logit-diff check against ONNX is done
+with an external script during development (not bundled in this
+package because it requires PyTorch / onnxruntime) and must not embed
+any private validation data into the public package.
+
+## 4. Update the bundled weights
+
+1. Place the new `.gguf` in `packages/classification-ggml/weights/`.
+2. Keep the filename identical (`mobilenetv3_3class_v3_fp16.gguf`) or
+   update `DEFAULT_WEIGHTS_FILENAME` in `index.js`.
+3. Bump the package version (`package.json` + `CHANGELOG.md`).
+4. Re-run `npm run test:integration` and `npm run test:cpp`.
+
+## 5. Supporting a new block table (advanced)
+
+If you switch to a different MobileNet variant (V3-Large, V4, etc.),
+update `kBlocks` / `kNumBlocks` in `MobileNetGraph.hpp` to reflect the new
+expand/project channels, kernel sizes, strides, SE reducer sizes, and
+HardSwish/ReLU flags. The graph construction loop iterates over `kBlocks`, but
+`kStemOutChannels`, `kTailOutChannels`, `kClassifierHidden` and the hard-coded tail conv
+name (`features.12.*` in `buildGraph`) must match too; GGUF names keep `features.<N>.block.<idx>.*`.
+
+## Known pitfalls
+
+| Pitfall | Symptom | Fix |
+|---------|---------|-----|
+| BN epsilon `= 1e-5` instead of `0.001` | Normalisation drift accumulated across 34 layers, observable class flips on representative images | Store `0.001` in `mobilenet.bn_eps` |
+| DW kernel as `[K, K, C, 1]` | `ggml_conv_2d_dw` asserts | Re-pack to `[K, K, 1, C]` |
+| Missing SE biases | First-class crashes | Always export `fc1.bias` / `fc2.bias` even if zero |
+| Classifier weight as `[OC, IC]` instead of `[IC, OC]` | `ggml_mul_mat` mis-computes | Transpose before writing to GGUF |
+| Mixed precision (some tensors FP32, some FP16) | Works, but bigger file | Standardise on FP16 for ship |
diff --git a/packages/classification-ggml/index.d.ts b/packages/classification-ggml/index.d.ts
new file mode 100644
index 0000000000..41051a8776
--- /dev/null
+++ b/packages/classification-ggml/index.d.ts
@@ -0,0 +1,96 @@
+/**
+ * Canonical labels emitted by the bundled 3-class MobileNetV3-Small model.
+ * The trailing `(string & {})` keeps the type permissive for fine-tunes that
+ * ship different class names via the GGUF `mobilenet.class_N` metadata. A
+ * bare `string` member would absorb the literals and collapse the union to
+ * `string`, losing editor completion for the canonical labels.
+ */
+export type ClassificationLabel =
+  | "food"
+  | "report"
+  | "other"
+  | (string & {});
+
+export interface ClassificationResult { // one element of the array `classify()` resolves with
+  /** Human-readable class label, sourced from the GGUF metadata (`mobilenet.class_N`). */
+  label: ClassificationLabel;
+  /** Softmax probability in `[0, 1]`. Values across all classes sum to ≈ 1. */
+  confidence: number;
+}
+
+export interface ClassifyOptions {
+  /** If set, limits the returned list to the top-K classes; must be a positive integer. Default: all classes. */
+  topK?: number;
+  /** Width (pixels), a positive integer. Required when passing raw RGB bytes. */
+  width?: number;
+  /** Height (pixels), a positive integer. Required when passing raw RGB bytes. */
+  height?: number;
+  /** Channel count. Must be `3` when passing raw RGB bytes. */
+  channels?: 3;
+}
+
+export interface ImageClassifierLogger { // shape of `ImageClassifierOptions.logger`; every member is optional
+  error?: (...args: unknown[]) => void;
+  warn?: (...args: unknown[]) => void;
+  info?: (...args: unknown[]) => void;
+  debug?: (...args: unknown[]) => void;
+  getLevel?: () => string;
+}
+
+export interface ImageClassifierOptions {
+  /**
+   * Absolute path to the FP16 GGUF weights file. Defaults to `QVAC_CLASSIFICATION_MODEL_PATH`
+   * when that env var is set, else the bundled `weights/mobilenetv3_3class_v3_fp16.gguf`.
+   */
+  modelPath?: string;
+  /** Optional logger compatible with `@qvac/logging`. */
+  logger?: ImageClassifierLogger;
+  /**
+   * When true, forwards native C++ log messages (`QLOG(...)` calls inside
+   * the addon) to the JS `logger`. Disabled by default: the underlying
+   * shared native logger singleton is not safe across rapid
+   * create/destroy cycles. JS-level logging (`load()` / `classify()` info
+   * lines from `index.js`) is always routed to `logger` regardless of
+   * this flag.
+   */
+  nativeLogger?: boolean;
+}
+
+export interface ImageClassifierState {
+  configLoaded: boolean; // false on construction; presumably set by load() — confirm in index.js
+  destroyed: boolean; // false on construction; presumably set by destroy() — confirm in index.js
+}
+
+/**
+ * MobileNetV3-Small 3-class image classifier backed by libggml on CPU.
+ */
+export declare class ImageClassifier {
+  constructor(opts?: ImageClassifierOptions);
+
+  readonly logger: ImageClassifierLogger; // built in the constructor from `opts.logger`
+
+  /** Loads the model and native resources. Idempotent. */
+  load(): Promise<void>;
+
+  /**
+   * Classifies an image buffer.
+   *
+   * @param imageInput JPEG or PNG buffer, or raw RGB bytes accompanied by
+   *                   `options.width`, `options.height`, `options.channels`.
+   * @param options see `ClassifyOptions`
+   */
+  classify(
+    imageInput: Uint8Array,
+    options?: ClassifyOptions,
+  ): Promise<ClassificationResult[]>;
+
+  /** Releases native resources. Safe to call multiple times. */
+  unload(): Promise<void>;
+
+  /** Releases native resources and marks this instance as destroyed. */
+  destroy(): Promise<void>;
+
+  getState(): ImageClassifierState; // lifecycle flags, see `ImageClassifierState`
+}
+
+export default ImageClassifier;
diff --git a/packages/classification-ggml/index.js b/packages/classification-ggml/index.js
new file mode 100644
index 0000000000..18fd5fa60b
--- /dev/null
+++ b/packages/classification-ggml/index.js
@@ -0,0 +1,208 @@
+'use strict'
+
+const fs = require('bare-fs')
+const path = require('bare-path')
+const process = require('bare-process')
+const QvacLogger = require('@qvac/logging')
+const { createJobHandler, exclusiveRunQueue } = require('@qvac/infer-base')
+
+const { ClassificationInterface, mapAddonEvent } = require('./addon')
+
+const DEFAULT_WEIGHTS_FILENAME = 'mobilenetv3_3class_v3_fp16.gguf'
+const RUN_BUSY_ERROR_MESSAGE = 'Cannot set new job: a job is already set or being processed'
+
+function resolveDefaultModelPath () {
+  if (typeof process !== 'undefined' && process.env && process.env.QVAC_CLASSIFICATION_MODEL_PATH) {
+    return process.env.QVAC_CLASSIFICATION_MODEL_PATH
+  }
+  return path.join(__dirname, 'weights', DEFAULT_WEIGHTS_FILENAME)
+}
+
+/**
+ * High-level classifier for MobileNetV3-Small 3-class image triage.
+ *
+ * ```js
+ * const classifier = new ImageClassifier()
+ * await classifier.load()
+ * const result = await classifier.classify(jpegBuffer)
+ * // [ { label: 'food', confidence: 0.93 }, ... ]
+ * await classifier.unload()
+ * ```
+ */
+class ImageClassifier {
+  /**
+   * @param {Object} [opts]
+   * @param {string} [opts.modelPath] absolute path to the FP16 GGUF file. Defaults to the bundled model.
+   * @param {Object} [opts.logger] optional `@qvac/logging`-compatible logger.
+   * @param {boolean} [opts.nativeLogger=false] forward C++-side log lines through `logger`.
+   */
+  constructor (opts = {}) {
+    const { modelPath, logger = null, nativeLogger = false } = opts
+    this._modelPath = modelPath ?? resolveDefaultModelPath()
+    this.logger = new QvacLogger(logger)
+    // Off by default: see `addon.js::_ensureLoggerInstalled` for the
+    // process-wide JsLogger lifecycle that opt-in unlocks.
+    this._nativeLogger = nativeLogger === true
+    this._addon = null
+    this._job = createJobHandler({ cancel: () => this._addon?.cancel() })
+    this._run = exclusiveRunQueue()
+    this._hasActiveResponse = false
+    this.state = { configLoaded: false, destroyed: false }
+  }
+
+  getState () { return { ...this.state } }
+
+  async load () {
+    return this._run(async () => {
+      if (this.state.configLoaded) return
+      await this._load()
+      this.state.configLoaded = true
+      this.logger.info('ImageClassifier loaded')
+    })
+  }
+
+  async _load () {
+    if (!fs.existsSync(this._modelPath)) {
+      throw new Error(`MobileNet GGUF weights not found at: ${this._modelPath}`)
+    }
+
+    // configurationParams is the C++ schema 1:1 — keep it free of any
+    // JS-only flags. The native-logger gate lives in the JS-side opts arg.
+    const configurationParams = {
+      path: this._modelPath,
+      config: { backendsDir: path.join(__dirname, 'prebuilds') }
+    }
+
+    const disableNativeLogger = !this._nativeLogger ||
+      (process.env && process.env.QVAC_CLASSIFICATION_DISABLE_NATIVE_LOGGER === '1')
+
+    try {
+      this._addon = this._createAddon(configurationParams, { disableNativeLogger })
+      await this._addon.activate()
+    } catch (loadError) {
+      this.logger.error('Error during model load:', loadError)
+      try { await this._addon?.unload?.() } catch (_) {}
+      this._addon = null
+      throw loadError
+    }
+  }
+
+  _createAddon (configurationParams, opts) {
+    const binding = require('./binding')
+    return new ClassificationInterface(
+      binding,
+      configurationParams,
+      this._addonOutputCallback.bind(this),
+      this.logger,
+      opts
+    )
+  }
+
+  /**
+   * Classifies one image.
+   *
+   * @param {Uint8Array} imageInput JPEG/PNG buffer, or raw RGB bytes with
+   *                                `options.width`, `options.height`, `options.channels=3`.
+   * @param {Object} [options]
+   * @param {number} [options.topK]    limit the number of returned classes
+   * @param {number} [options.width]   raw RGB width (required for raw input)
+   * @param {number} [options.height]  raw RGB height (required for raw input)
+   * @param {number} [options.channels] raw RGB channel count (must be 3)
+   * @returns {Promise<Array<{label: string, confidence: number}>>}
+   *          sorted by `confidence` descending. Always returns all classes
+   *          unless `options.topK` is set.
+   */
+  async classify (imageInput, options = undefined) {
+    return this._run(() => this._classifyInternal(imageInput, options))
+  }
+
+  async _classifyInternal (imageInput, options) {
+    if (!this._addon || !this.state.configLoaded) {
+      throw new Error('Classifier not loaded. Call load() first.')
+    }
+    if (this._hasActiveResponse) {
+      throw new Error(RUN_BUSY_ERROR_MESSAGE)
+    }
+
+    const job = { type: 'image', content: imageInput }
+    if (options) {
+      if (options.width !== undefined) job.width = options.width
+      if (options.height !== undefined) job.height = options.height
+      if (options.channels !== undefined) job.channels = options.channels
+      if (options.topK !== undefined) job.topK = options.topK
+    }
+
+    const response = this._job.start()
+
+    let accepted
+    try {
+      accepted = await this._addon.runJob(job)
+    } catch (err) {
+      this._job.fail(err)
+      throw err
+    }
+    if (!accepted) {
+      const err = new Error('Classification job was rejected by the native runner')
+      this._job.fail(err)
+      throw err
+    }
+
+    this._hasActiveResponse = true
+    const collected = await response.await().finally(() => {
+      this._hasActiveResponse = false
+    })
+    // QvacResponse collects each Output event into an array; classify
+    // emits exactly one, so unwrap to preserve the public shape.
+    return Array.isArray(collected) && Array.isArray(collected[0])
+      ? collected[0]
+      : collected
+  }
+
+  _handleAddonOutputEvent (eventType, data, error) {
+    if (eventType === 'LogMsg') {
+      const msg = typeof data === 'string' ? data : (data?.message || JSON.stringify(data))
+      this.logger?.info?.(msg)
+      return
+    }
+    if (eventType === 'Error') {
+      const err = error instanceof Error
+        ? error
+        : new Error((error && error.message) || (typeof error === 'string' ? error : 'Classification failed'))
+      this._job.fail(err)
+    } else if (eventType === 'Output') {
+      this._job.output(data)
+    } else if (eventType === 'JobEnded') {
+      this._job.end()
+    }
+  }
+
+  _addonOutputCallback (addon, event, data, error) {
+    const mapped = mapAddonEvent(event, data, error)
+    if (mapped === null) return
+    this._handleAddonOutputEvent(mapped.type, mapped.data, mapped.error)
+  }
+
+  /** Idempotent. Cancels any in-flight job before destroying the handle. */
+  async unload () {
+    return this._run(async () => {
+      try { if (this._addon?.cancel) await this._addon.cancel() } catch (_) {}
+      if (this._job.active) {
+        this._job.fail(new Error('Model was unloaded'))
+      }
+      this._hasActiveResponse = false
+      if (this._addon) {
+        await this._addon.unload()
+        this._addon = null
+      }
+      this.state.configLoaded = false
+    })
+  }
+
+  async destroy () {
+    await this.unload()
+    this.state.destroyed = true
+  }
+}
+
+module.exports = ImageClassifier
+module.exports.ImageClassifier = ImageClassifier
diff --git a/packages/classification-ggml/package.json b/packages/classification-ggml/package.json
new file mode 100644
index 0000000000..cb46086452
--- /dev/null
+++ b/packages/classification-ggml/package.json
@@ -0,0 +1,88 @@
+{
+  "name": "@qvac/classification-ggml",
+  "version": "0.1.0",
+  "description": "GGML image classification addon for QVAC (MobileNetV3-Small CPU inference)",
+  "addon": true,
+  "scripts": {
+    "build": "bare-make generate && bare-make build && bare-make install",
+    "build:pack": "mkdir -p dist && npm pack --pack-destination dist",
+    "mobile:copy-prebuilds": "node ./scripts/copy-mobile-test-assets.js",
+    "lint": "standard --ignore \"addon/**\"",
+    "lint:fix": "standard --ignore \"addon/**\" --fix",
+    "lint-cpp": "clang-tidy -p build addon/src/js-interface/binding.cpp addon/src/model-interface/ClassificationModel.cpp addon/src/model-interface/ImagePreprocessor.cpp addon/src/model-interface/MobileNetGraph.cpp",
+    "test": "npm run test:integration",
+    "test:unit:generate": "brittle -r test/unit/all.js test/unit/*.test.js",
+    "test:unit": "npm run test:unit:generate && bare test/unit/all.js --exit",
+    "test:integration": "npm run test:integration:generate && bare test/integration/all.js --exit",
+    "test:integration:generate": "brittle -r test/integration/all.js test/integration/*.test.js && npm run test:mobile:generate",
+    "test:mobile:generate": "bare ./scripts/generate-mobile-integration-tests.js",
+    "test:mobile:validate": "node scripts/validate-mobile-tests.js",
+    "test:cpp:build": "bare-make generate -D BUILD_TESTING=ON && bare-make build --target addon-test",
+    "test:cpp:run": "node scripts/run-cpp-tests.js",
+    "test:cpp": "npm run test:cpp:build && npm run test:cpp:run",
+    "test:dts": "tsc -p tsconfig.dts.json",
+    "test:all": "npm run test:unit && npm run test:integration && npm run test:cpp"
+  },
+  "standard": {
+    "ignore": [
+      "addon/**",
+      "third-party/**",
+      "prebuilds/**",
+      "build/**",
+      "test/mobile/integration.auto.cjs"
+    ]
+  },
+  "files": [
+    "binding.js",
+    "index.js",
+    "addon.js",
+    "index.d.ts",
+    "prebuilds",
+    "weights",
+    "test/mobile",
+    "test/integration",
+    "test/images",
+    "LICENSE",
+    "NOTICE",
+    "README.md"
+  ],
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/tetherto/qvac.git",
+    "directory": "packages/classification-ggml"
+  },
+  "author": "Tether",
+  "license": "Apache-2.0",
+  "bugs": "https://github.com/tetherto/qvac/issues",
+  "homepage": "https://github.com/tetherto/qvac/tree/main/packages/classification-ggml#readme",
+  "devDependencies": {
+    "@types/node": "^24.2.1",
+    "bare-url": "^2.1.6",
+    "brittle": "^3.16.5",
+    "cmake-bare": "1.7.5",
+    "cmake-vcpkg": "^1.1.0",
+    "standard": "^17.0.0",
+    "typescript": "^5.9.2"
+  },
+  "dependencies": {
+    "@qvac/infer-base": "^0.4.0",
+    "@qvac/logging": "^0.1.0",
+    "bare-fs": "^4.5.1",
+    "bare-path": "^3.0.0",
+    "bare-process": "^4.2.2"
+  },
+  "engines": {
+    "bare": ">=1.24.0"
+  },
+  "peerDependencies": {},
+  "exports": {
+    "./package": "./package.json",
+    ".": {
+      "types": "./index.d.ts",
+      "default": "./index.js"
+    },
+    "./addon.js": "./addon.js",
+    "./binding.js": "./binding.js"
+  },
+  "types": "index.d.ts"
+}
diff --git a/packages/classification-ggml/scripts/copy-mobile-test-assets.js b/packages/classification-ggml/scripts/copy-mobile-test-assets.js
new file mode 100644
index 0000000000..d81d757094
--- /dev/null
+++ b/packages/classification-ggml/scripts/copy-mobile-test-assets.js
@@ -0,0 +1,166 @@
+#!/usr/bin/env node
+'use strict'
+
+// Prepare prebuilds and test assets for the on-device mobile test framework.
+//
+// Responsibilities (test images are also copied; see copyTestImagesToTestAssets):
+//
+//   1. Replicate the single arm64 native prebuild we ship across the
+//      additional `<platform>-<arch>` directory names that the mobile
+//      test framework expects to find under `prebuilds/`. Without these
+//      copies the framework cannot match a native binary for the device
+//      arch flavour it is targeting (e.g. android-x64, ios-arm64-simulator).
+//
+//   2. Copy the FP16 GGUF weights bundle from `weights/` into
+//      `test/mobile/testAssets/`. On mobile, the bare runtime cannot
+//      access files in the npm package's `weights/` directory at runtime
+//      because the worklet is loaded from a packed `.bundle`; the test
+//      framework instead pushes everything under `test/mobile/testAssets/`
+//      to the device and exposes their on-device paths via
+//      `global.assetPaths`. Without this copy `ImageClassifier.load()`
+//      fails with `MobileNet GGUF weights not found at /app.bundle/...`.
+//
+// Idempotent: weights and test images are re-copied (overwriting silently) on
+// every run, while prebuild flavour directories that already exist are left as-is.
+
+const fs = require('fs')
+const path = require('path')
+
+const ADDON_DIR = path.resolve(__dirname, '..')
+const PREBUILDS_DIR = path.join(ADDON_DIR, 'prebuilds')
+const WEIGHTS_DIR = path.join(ADDON_DIR, 'weights')
+const TEST_ASSETS_DIR = path.join(ADDON_DIR, 'test', 'mobile', 'testAssets')
+const TEST_IMAGES_DIR = path.join(ADDON_DIR, 'test', 'images')
+
+// The qvac-test-addon-mobile framework's metro.config.js registers
+// `assetExts: ['so', 'bin', 'model', 'bundle', 'raw', 'onnx']`. It does
+// NOT include `.gguf`, so a file with that extension placed under
+// `testAssets/` is treated by the React Native bundler as a JS-source
+// request and the on-device build aborts with
+//   `Unable to resolve module ../assets/testAssets/<file>.gguf`
+// at the `:app:createBundleReleaseJsAndAssets` step (see CI run
+// 25002820522). We work around this by copying the GGUF blob with a
+// `.bin` suffix appended -- `.bin` is in the framework's accepted
+// list, the bundler treats it as a binary asset, and the file is
+// pushed to the device verbatim. ggml's `gguf_init_from_file` reads
+// by path and parses the GGUF magic bytes; it does not validate the
+// file extension, so the rename is purely a packaging detail.
+//
+// The pair below is `[<source filename in weights/>, <destination
+// filename in test/mobile/testAssets/>]`. `resolveModelPath()` in
+// `test/integration/utils.js` looks up the destination filename when
+// running on mobile.
+const WEIGHT_FILES = [
+  ['mobilenetv3_3class_v3_fp16.gguf', 'mobilenetv3_3class_v3_fp16.gguf.bin']
+]
+
+const ANDROID_FLAVOURS = ['android-arm64', 'android-arm', 'android-ia32', 'android-x64']
+const IOS_FLAVOURS = ['ios-arm64', 'ios-arm64-simulator', 'ios-x64-simulator']
+
+function copyDirRecursive (src, dst) {
+  if (!fs.existsSync(src)) return false
+  fs.mkdirSync(dst, { recursive: true })
+  for (const entry of fs.readdirSync(src, { withFileTypes: true })) {
+    const sChild = path.join(src, entry.name)
+    const dChild = path.join(dst, entry.name)
+    if (entry.isDirectory()) {
+      copyDirRecursive(sChild, dChild)
+    } else if (entry.isFile()) {
+      fs.copyFileSync(sChild, dChild)
+    }
+  }
+  return true
+}
+
+function fanOutPrebuilds (sourceFlavour, allFlavours) {
+  const sourceDir = path.join(PREBUILDS_DIR, sourceFlavour)
+  if (!fs.existsSync(sourceDir)) {
+    console.log(`[mobile:copy-prebuilds] Source prebuilds not found: ${sourceDir}; skipping fan-out for ${allFlavours.join(', ')}`)
+    return
+  }
+  for (const target of allFlavours) {
+    if (target === sourceFlavour) continue
+    const targetDir = path.join(PREBUILDS_DIR, target)
+    if (fs.existsSync(targetDir)) {
+      console.log(`[mobile:copy-prebuilds] ${target} already present, leaving as-is`)
+      continue
+    }
+    if (copyDirRecursive(sourceDir, targetDir)) {
+      console.log(`[mobile:copy-prebuilds] Copied ${sourceFlavour} -> ${target}`)
+    }
+  }
+}
+
+// Copy every classification test image (`test/images/*.{jpg,jpeg,png}`)
+// into `test/mobile/testAssets/`. The qvac-test-addon-mobile framework
+// pushes everything under `test/mobile/testAssets/` to the device and
+// exposes their on-device paths through `global.assetPaths`, keyed by
+// `../../testAssets/<filename>`. Without this copy `loadImage()` in
+// `test/integration/utils.js` falls back to a desktop-style fs lookup
+// inside the packed `app.bundle/` (which is not a real filesystem) and
+// the bare runtime aborts with `FileError: ENOENT, open
+// "/app.bundle/backend/test/images/<file>"`. Image extensions
+// (`.jpg`/`.png`) are part of React Native's default `assetExts`, so
+// no rename is required (unlike the GGUF blob).
+function copyTestImagesToTestAssets () {
+  if (!fs.existsSync(TEST_IMAGES_DIR)) {
+    console.error(`[mobile:copy-prebuilds] FATAL: test images directory not found: ${TEST_IMAGES_DIR}`)
+    console.error('[mobile:copy-prebuilds] The integration test images must be present before mobile tests can run.')
+    process.exit(1)
+  }
+  fs.mkdirSync(TEST_ASSETS_DIR, { recursive: true })
+  const allowedExts = new Set(['.jpg', '.jpeg', '.png'])
+  let copied = 0
+  for (const entry of fs.readdirSync(TEST_IMAGES_DIR, { withFileTypes: true })) {
+    if (!entry.isFile()) continue
+    const ext = path.extname(entry.name).toLowerCase()
+    if (!allowedExts.has(ext)) continue
+    const src = path.join(TEST_IMAGES_DIR, entry.name)
+    const dst = path.join(TEST_ASSETS_DIR, entry.name)
+    fs.copyFileSync(src, dst)
+    const sizeKb = (fs.statSync(dst).size / 1024).toFixed(1)
+    console.log(`[mobile:copy-prebuilds] Copied test image ${entry.name} -> ${path.relative(ADDON_DIR, dst)} (${sizeKb} KB)`)
+    copied++
+  }
+  if (copied === 0) {
+    console.error(`[mobile:copy-prebuilds] FATAL: no test images were found in ${TEST_IMAGES_DIR}`)
+    process.exit(1)
+  }
+}
+
+function copyWeightsToTestAssets () {
+  if (!fs.existsSync(WEIGHTS_DIR)) {
+    console.error(`[mobile:copy-prebuilds] FATAL: weights directory not found: ${WEIGHTS_DIR}`)
+    console.error('[mobile:copy-prebuilds] The bundled GGUF model must be present before mobile tests can run.')
+    process.exit(1)
+  }
+  fs.mkdirSync(TEST_ASSETS_DIR, { recursive: true })
+  let copied = 0
+  for (const [srcName, dstName] of WEIGHT_FILES) {
+    const src = path.join(WEIGHTS_DIR, srcName)
+    const dst = path.join(TEST_ASSETS_DIR, dstName)
+    if (!fs.existsSync(src)) {
+      console.error(`[mobile:copy-prebuilds] FATAL: required weights file missing: ${src}`)
+      process.exit(1)
+    }
+    fs.copyFileSync(src, dst)
+    const sizeMb = (fs.statSync(dst).size / 1024 / 1024).toFixed(1)
+    console.log(`[mobile:copy-prebuilds] Copied weights ${srcName} -> ${path.relative(ADDON_DIR, dst)} (${sizeMb} MB)`)
+    copied++
+  }
+  if (copied === 0) {
+    console.error('[mobile:copy-prebuilds] FATAL: no weight files were copied')
+    process.exit(1)
+  }
+}
+
+function main () { // entry point, invoked unconditionally at the bottom of this script
+  console.log(`[mobile:copy-prebuilds] Preparing mobile assets in ${ADDON_DIR}`)
+  fanOutPrebuilds('android-arm64', ANDROID_FLAVOURS) // android-arm64 is the source copied to the other Android flavours
+  fanOutPrebuilds('ios-arm64', IOS_FLAVOURS) // ios-arm64 is the source copied to the simulator flavours
+  copyWeightsToTestAssets() // exits the process with status 1 if the weights are missing
+  copyTestImagesToTestAssets() // exits the process with status 1 if no test image is found
+  console.log('[mobile:copy-prebuilds] Done.')
+}
+
+main()
diff --git a/packages/classification-ggml/scripts/generate-mobile-integration-tests.js b/packages/classification-ggml/scripts/generate-mobile-integration-tests.js
new file mode 100644
index 0000000000..4d989dadf4
--- /dev/null
+++ b/packages/classification-ggml/scripts/generate-mobile-integration-tests.js
@@ -0,0 +1,75 @@
+'use strict'
+
+// Scans test/integration for *.test.js files and generates a mobile
+// wrapper at test/mobile/integration.auto.cjs. Each generated wrapper
+// function loads one integration test module via the shared mobile
+// integration runtime so the mobile test framework (qvac-test-addon-mobile)
+// can invoke them individually. Matches the pattern used by the other
+// QVAC inference addons (nmtcpp, diffusion, llamacpp-*).
+
+const fs = require('bare-fs')
+const path = require('bare-path')
+
+const repoRoot = path.resolve(__dirname, '..')
+const integrationDir = path.join(repoRoot, 'test', 'integration')
+const mobileDir = path.join(repoRoot, 'test', 'mobile')
+const outputFile = path.join(mobileDir, 'integration.auto.cjs')
+
+function getIntegrationFiles () {
+  if (!fs.existsSync(integrationDir)) {
+    throw new Error(`Integration directory not found: ${integrationDir}`)
+  }
+
+  return fs.readdirSync(integrationDir)
+    .filter(entry => entry.endsWith('.test.js'))
+    .sort()
+}
+
+function toFunctionName (fileName) {
+  const base = fileName.replace(/\.test\.js$/, '')
+  const parts = base.split(/[^a-zA-Z0-9]+/).filter(Boolean)
+  const suffix = parts.map(part => part.charAt(0).toUpperCase() + part.slice(1)).join('')
+  return `run${suffix}`
+}
+
+function buildFileContents (files) {
+  const lines = []
+  lines.push("'use strict'")
+  lines.push("require('./integration-runtime.cjs')")
+  lines.push('')
+  lines.push('/* global runIntegrationModule */')
+  lines.push('')
+
+  for (let i = 0; i < files.length; i++) {
+    const file = files[i]
+    const fnName = toFunctionName(file)
+    const relativePath = `../integration/${file}`
+    lines.push(`async function ${fnName} (options = {}) { // eslint-disable-line no-unused-vars`)
+    lines.push(`  return runIntegrationModule('${relativePath}', options)`)
+    lines.push('}')
+    if (i < files.length - 1) {
+      lines.push('')
+    }
+  }
+
+  return `${lines.join('\n')}\n`
+}
+
+function main () {
+  if (!fs.existsSync(mobileDir)) {
+    fs.mkdirSync(mobileDir, { recursive: true })
+  }
+
+  const files = getIntegrationFiles()
+  if (files.length === 0) {
+    throw new Error(`No integration test files found inside ${integrationDir}`)
+  }
+
+  const content = buildFileContents(files)
+  fs.writeFileSync(outputFile, content, 'utf8')
+  console.log(`Generated ${outputFile} with ${files.length} integration runners.`)
+}
+
+if (require.main === module) {
+  main()
+}
diff --git a/packages/classification-ggml/scripts/run-cpp-tests.js b/packages/classification-ggml/scripts/run-cpp-tests.js
new file mode 100644
index 0000000000..2e56e31f50
--- /dev/null
+++ b/packages/classification-ggml/scripts/run-cpp-tests.js
@@ -0,0 +1,20 @@
+'use strict'
+
+const path = require('path')
+const os = require('os')
+const { spawnSync } = require('child_process')
+
+const binary = os.platform() === 'win32' ? 'addon-test.exe' : './addon-test'
+const cwd = path.resolve(__dirname, '..', 'build', 'test', 'unit')
+
+const result = spawnSync(binary, ['--gtest_output=xml:cpp-test-results.xml'], {
+  cwd,
+  stdio: 'inherit',
+  shell: false
+})
+
+if (result.error) {
+  throw result.error
+}
+
+process.exit(result.status || 0)
diff --git a/packages/classification-ggml/scripts/validate-mobile-tests.js b/packages/classification-ggml/scripts/validate-mobile-tests.js
new file mode 100644
index 0000000000..4cc958990b
--- /dev/null
+++ b/packages/classification-ggml/scripts/validate-mobile-tests.js
@@ -0,0 +1,44 @@
+'use strict'
+
+// Node-side (not Bare) structural validator for the mobile test layout.
+// Used by CI to fail early if the generator hasn't been run or the mobile
+// runtime helper is missing. Mirrors the pattern used by the other QVAC
+// inference addons (nmtcpp, diffusion, llamacpp-*).
+
+const fs = require('fs')
+const path = require('path')
+const process = require('process')
+
+const repoRoot = path.resolve(__dirname, '..')
+const mobileDir = path.join(repoRoot, 'test', 'mobile')
+const autoFile = path.join(mobileDir, 'integration.auto.cjs')
+const runtimeFile = path.join(mobileDir, 'integration-runtime.cjs')
+
+function main () {
+  const errors = []
+
+  if (!fs.existsSync(mobileDir)) {
+    errors.push(`Mobile test directory not found: ${mobileDir}`)
+  }
+
+  if (!fs.existsSync(autoFile)) {
+    errors.push(`Auto-generated file not found: ${autoFile}`)
+    errors.push('Run `npm run test:mobile:generate` to create it')
+  }
+
+  if (!fs.existsSync(runtimeFile)) {
+    errors.push(`Runtime file not found: ${runtimeFile}`)
+  }
+
+  if (errors.length > 0) {
+    console.error('Mobile test validation failed:')
+    errors.forEach(err => console.error('  -', err))
+    process.exit(1)
+  }
+
+  console.log('Mobile test structure is valid')
+}
+
+if (require.main === module) {
+  main()
+}
diff --git a/packages/classification-ggml/test/images/meal_1.jpg b/packages/classification-ggml/test/images/meal_1.jpg
new file mode 100644
index 0000000000..024356989a
Binary files /dev/null and b/packages/classification-ggml/test/images/meal_1.jpg differ
diff --git a/packages/classification-ggml/test/images/meal_2.jpg b/packages/classification-ggml/test/images/meal_2.jpg
new file mode 100644
index 0000000000..3be14c6f68
Binary files /dev/null and b/packages/classification-ggml/test/images/meal_2.jpg differ
diff --git a/packages/classification-ggml/test/images/other_1.jpg b/packages/classification-ggml/test/images/other_1.jpg
new file mode 100644
index 0000000000..69bc7f479f
Binary files /dev/null and b/packages/classification-ggml/test/images/other_1.jpg differ
diff --git a/packages/classification-ggml/test/images/other_2.jpg b/packages/classification-ggml/test/images/other_2.jpg
new file mode 100644
index 0000000000..e3efef595c
Binary files /dev/null and b/packages/classification-ggml/test/images/other_2.jpg differ
diff --git a/packages/classification-ggml/test/images/report_1.jpg b/packages/classification-ggml/test/images/report_1.jpg
new file mode 100644
index 0000000000..15d2048fa7
Binary files /dev/null and b/packages/classification-ggml/test/images/report_1.jpg differ
diff --git a/packages/classification-ggml/test/images/report_2.jpg b/packages/classification-ggml/test/images/report_2.jpg
new file mode 100644
index 0000000000..e4da1b697a
Binary files /dev/null and b/packages/classification-ggml/test/images/report_2.jpg differ
diff --git a/packages/classification-ggml/test/integration/all.js b/packages/classification-ggml/test/integration/all.js
new file mode 100644
index 0000000000..4cd0002081
--- /dev/null
+++ b/packages/classification-ggml/test/integration/all.js
@@ -0,0 +1,14 @@
+// This runner is auto-generated by Brittle
+
+runTests()
+
+async function runTests () {
+  const test = (await import('brittle')).default
+
+  test.pause() // pause brittle until every test file below has been imported
+
+  await import('./classify.test.js')
+  await import('./error-cases.test.js')
+
+  test.resume() // resume brittle once all imports have finished
+}
diff --git a/packages/classification-ggml/test/integration/classify.test.js b/packages/classification-ggml/test/integration/classify.test.js
new file mode 100644
index 0000000000..2cb16766e5
--- /dev/null
+++ b/packages/classification-ggml/test/integration/classify.test.js
@@ -0,0 +1,157 @@
+'use strict'
+
+const test = require('brittle')
+
+const {
+  IMAGE_SAMPLES,
+  loadImage,
+  TEST_TIMEOUT,
+  recordMetric,
+  recordLoadTime,
+  makeClassifier,
+  cleanupClassifier
+} = require('./utils')
+
+test('load() + classify() returns a shaped result for every sample image', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  const loadStart = Date.now()
+  await classifier.load()
+  const loadElapsed = Date.now() - loadStart
+  recordLoadTime('load:cold', loadElapsed) // wall-clock time of the first load() on this instance
+  try {
+    for (const sample of IMAGE_SAMPLES) {
+      const buffer = loadImage(sample.file)
+      const start = Date.now()
+      const result = await classifier.classify(buffer)
+      const elapsed = Date.now() - start
+
+      // Always emit the full result into the TAP stream so CI logs
+      // contain the actual model output for every platform, even on
+      // success. When an assertion fails (e.g. the win32 CI meal_1
+      // anomaly), this line is what lets us diagnose without needing
+      // to add instrumentation in a follow-up commit.
+      t.comment(
+        `${sample.file} elapsed=${elapsed}ms result=` +
+        JSON.stringify(
+          Array.isArray(result)
+            ? result.map((r) => ({
+              label: r && r.label,
+              confidence: typeof r?.confidence === 'number'
+                ? r.confidence.toFixed(6)
+                : String(r?.confidence)
+            }))
+            : result
+        )
+      )
+
+      // Shape + per-entry validity: distinguish "not a number / NaN /
+      // Inf" from "number outside [0,1]" so a future failure tells us
+      // the kind of corruption rather than just "bad value".
+      t.ok(Array.isArray(result), `${sample.file}: result is an array`)
+      t.is(result.length, 3, `${sample.file}: 3 classes returned`) // no topK passed, so every class is expected
+      for (let idx = 0; idx < result.length; idx++) {
+        const entry = result[idx]
+        t.is(typeof entry.label, 'string',
+          `${sample.file}[${idx}]: label is a string`)
+        t.ok(typeof entry.confidence === 'number',
+          `${sample.file}[${idx}]: confidence is a number`)
+        t.ok(Number.isFinite(entry.confidence),
+          `${sample.file}[${idx}]: confidence is finite (not NaN/Inf)`)
+        t.ok(entry.confidence >= 0 && entry.confidence <= 1,
+          `${sample.file}[${idx}]: confidence is in [0, 1] (got ${entry.confidence})`)
+      }
+
+      // Sum-to-one guarantee from the C++ softmax. If this ever fails
+      // the diagnostic comment above tells us the per-element values.
+      const sum = result.reduce((acc, r) => acc + r.confidence, 0)
+      t.ok(Number.isFinite(sum), `${sample.file}: probability sum is finite (got ${sum})`)
+      t.ok(Math.abs(sum - 1) < 1e-3,
+        `${sample.file}: probabilities sum ≈ 1.0 (sum=${sum.toFixed(6)})`)
+
+      // Sort order. We split the two pairwise comparisons so a failure
+      // tells us which adjacent pair is misordered.
+      t.ok(result[0].confidence >= result[1].confidence,
+        `${sample.file}: sorted desc [0]>=[1] (got ${result[0].confidence.toFixed(6)} vs ${result[1].confidence.toFixed(6)})`)
+      t.ok(result[1].confidence >= result[2].confidence,
+        `${sample.file}: sorted desc [1]>=[2] (got ${result[1].confidence.toFixed(6)} vs ${result[2].confidence.toFixed(6)})`)
+
+      t.is(result[0].label, sample.expected,
+        `${sample.file}: top class should be '${sample.expected}'`)
+
+      recordMetric(`classify:${sample.file}`, elapsed, sample.file)
+    }
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('topK limits output count', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    const buffer = loadImage('meal_1.jpg') // the same image is classified twice with different topK limits
+    const top1 = await classifier.classify(buffer, { topK: 1 })
+    t.comment(`topK=1 result=${JSON.stringify(top1)}`)
+    t.is(top1.length, 1, 'topK=1 returns exactly one entry')
+    t.ok(Number.isFinite(top1[0].confidence),
+      `topK=1 [0].confidence is finite (got ${top1[0].confidence})`)
+    t.ok(top1[0].confidence > 0,
+      `topK=1 top entry has nonzero confidence (got ${top1[0].confidence})`)
+
+    const top2 = await classifier.classify(buffer, { topK: 2 })
+    t.comment(`topK=2 result=${JSON.stringify(top2)}`)
+    t.is(top2.length, 2, 'topK=2 returns exactly two entries')
+    t.ok(Number.isFinite(top2[0].confidence) && Number.isFinite(top2[1].confidence),
+      'topK=2 both confidences are finite')
+    t.ok(top2[0].confidence >= top2[1].confidence,
+      `topK=2 sorted desc (got ${top2[0].confidence} vs ${top2[1].confidence})`)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('multiple sequential classifications produce consistent output', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    const buffer = loadImage('report_1.jpg')
+    const a = await classifier.classify(buffer)
+    const b = await classifier.classify(buffer) // identical input, second pass on the same loaded instance
+    t.comment(`a=${JSON.stringify(a)}`)
+    t.comment(`b=${JSON.stringify(b)}`)
+    t.ok(Number.isFinite(a[0].confidence) && Number.isFinite(b[0].confidence),
+      'both top confidences are finite')
+    t.is(a[0].label, b[0].label, 'top class is stable across calls')
+    t.ok(Math.abs(a[0].confidence - b[0].confidence) < 1e-5,
+      `top confidence is deterministic on CPU (a=${a[0].confidence}, b=${b[0].confidence})`)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('raw RGB bytes path', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    const width = 10
+    const height = 10
+    const channels = 3
+    const raw = Buffer.alloc(width * height * channels, 128) // every byte is 128: a uniform 10x10 RGB frame with no JPEG/PNG header
+    const result = await classifier.classify(raw, { width, height, channels })
+    t.comment(`raw RGB result=${JSON.stringify(result)}`)
+    t.is(result.length, 3, 'returns all classes for raw input')
+    for (let idx = 0; idx < result.length; idx++) {
+      t.ok(Number.isFinite(result[idx].confidence),
+        `raw RGB [${idx}].confidence is finite (got ${result[idx].confidence})`)
+    }
+    const sum = result.reduce((acc, r) => acc + r.confidence, 0)
+    t.ok(Math.abs(sum - 1) < 1e-3,
+      `raw input probabilities sum ≈ 1.0 (sum=${sum.toFixed(6)})`)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
diff --git a/packages/classification-ggml/test/integration/error-cases.test.js b/packages/classification-ggml/test/integration/error-cases.test.js
new file mode 100644
index 0000000000..3504aac887
--- /dev/null
+++ b/packages/classification-ggml/test/integration/error-cases.test.js
@@ -0,0 +1,128 @@
+'use strict'
+
+const test = require('brittle')
+
+const { loadImage, TEST_TIMEOUT, makeClassifier, cleanupClassifier } = require('./utils')
+
+test('classify(null) rejects with structured error', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    await t.exception.all(() => classifier.classify(null), /required|null|undefined/i)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify(empty buffer) rejects', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    await t.exception.all(() => classifier.classify(Buffer.alloc(0)), /empty/i)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify(non-image buffer without dims) rejects', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    await t.exception.all(() => classifier.classify(Buffer.from('not an image')),
+      /unsupported|jpeg|png/i)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify(truncated JPEG) rejects without crashing', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    const full = loadImage('meal_1.jpg')
+    const truncated = full.slice(0, Math.min(128, full.length))
+    await t.exception.all(() => classifier.classify(truncated), /decode|corrupt|invalid|jpeg/i)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify(raw bytes with mismatched dimensions) rejects', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    const bad = Buffer.alloc(10 * 10 * 3, 0)
+    await t.exception.all(
+      () => classifier.classify(bad, { width: 999, height: 999, channels: 3 }),
+      /does not match|size/i
+    )
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify(bmp buffer) rejects as unsupported format', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    // BMP signature 'BM' followed by a minimal header.
+    const bmp = Buffer.from([0x42, 0x4D, 0x00, 0x00, 0x00, 0x00])
+    await t.exception.all(() => classifier.classify(bmp), /unsupported|jpeg|png/i)
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify before load() rejects', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  try {
+    await t.exception.all(
+      () => classifier.classify(loadImage('meal_1.jpg')),
+      /not loaded|load\(\)/i
+    )
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('classify after unload() rejects', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  await cleanupClassifier(classifier)
+  await t.exception.all(
+    () => classifier.classify(loadImage('meal_1.jpg')),
+    /not loaded|load\(\)/i
+  )
+})
+
+test('tiny 1x1 raw image is accepted (upscaled)', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  const classifier = makeClassifier()
+  await classifier.load()
+  try {
+    const tiny = Buffer.from([200, 150, 50])
+    const result = await classifier.classify(tiny, { width: 1, height: 1, channels: 3 })
+    t.is(result.length, 3, 'returns all classes for 1x1 upscale')
+  } finally {
+    await cleanupClassifier(classifier)
+  }
+})
+
+test('load -> unload -> load cycles do not leak handles', async function (t) {
+  t.timeout(TEST_TIMEOUT)
+  for (let i = 0; i < 3; i++) {
+    const classifier = makeClassifier()
+    await classifier.load()
+    const r = await classifier.classify(loadImage('meal_1.jpg'))
+    t.ok(Array.isArray(r), `cycle ${i}: classify works`)
+    await cleanupClassifier(classifier)
+  }
+})
diff --git a/packages/classification-ggml/test/integration/utils.js b/packages/classification-ggml/test/integration/utils.js
new file mode 100644
index 0000000000..8f798a9f23
--- /dev/null
+++ b/packages/classification-ggml/test/integration/utils.js
@@ -0,0 +1,219 @@
+'use strict'
+
+const fs = require('bare-fs')
+const path = require('bare-path')
+const os = require('bare-os')
+const process = require('bare-process')
+
+const ImageClassifier = require('../../index')
+
+const platform = process.platform
+const isMobile = platform === 'ios' || platform === 'android'
+
+// Dynamic require via path.join — bare-pack would otherwise resolve the
+// script path at mobile bundle time and fail the lookup.
+let createPerformanceReporter
+const _scriptBase = path.join('..', '..', '..', '..', 'scripts', 'test-utils')
+try {
+  const perfReporterMod = require(path.join(_scriptBase, 'performance-reporter'))
+  perfReporterMod.configure({ fs, path, process, os })
+  createPerformanceReporter = perfReporterMod.createPerformanceReporter
+} catch (_) {
+  // No-op fallback for published-tarball runs that lack scripts/.
+  createPerformanceReporter = function (opts) {
+    return {
+      record () {},
+      toJSON () { return { schema_version: '1.0', addon: opts.addon, results: [] } },
+      writeReport () {},
+      writeStepSummary () {},
+      get length () { return 0 }
+    }
+  }
+}
+
+const _perfReporter = createPerformanceReporter({
+  addon: 'ggml-classification',
+  addonType: 'generic'
+})
+
+const _reportPath = path.resolve(__dirname, '../../test/results/performance-report.json')
+let _exitHookInstalled = false
+
+function _installExitHook () {
+  if (_exitHookInstalled) return // idempotent: the listener is registered once
+  _exitHookInstalled = true
+  // On exit: rewrite the JSON report (normally already current thanks to
+  // _flushReport()) and emit the GitHub Step Summary, if metrics exist.
+  process.on('exit', () => {
+    if (_perfReporter.length > 0) {
+      _perfReporter.writeReport(_reportPath)
+      _perfReporter.writeStepSummary()
+    }
+  })
+}
+
+function _flushReport () {
+  if (_perfReporter.length === 0) return
+  // Persist after every metric so SIGSEGV mid-suite still leaves a
+  // partial report on disk.
+  _perfReporter.writeReport(_reportPath)
+}
+
+const DESKTOP_TIMEOUT = 120 * 1000
+const MOBILE_TIMEOUT = 600 * 1000
+const TEST_TIMEOUT = isMobile ? MOBILE_TIMEOUT : DESKTOP_TIMEOUT
+
+function createLogger () {
+  return {
+    error: (msg) => console.log('[C++ ERROR]:', msg),
+    warn: (msg) => console.log('[C++ WARN]:', msg),
+    info: (msg) => console.log('[C++ INFO]:', msg),
+    debug: (msg) => console.log('[C++ DEBUG]:', msg),
+    getLevel: () => 'debug'
+  }
+}
+
+const IMAGE_DIR = path.resolve(__dirname, '..', 'images')
+
+const IMAGE_SAMPLES = [
+  { file: 'meal_1.jpg', expected: 'food' },
+  { file: 'meal_2.jpg', expected: 'food' },
+  { file: 'report_1.jpg', expected: 'report' },
+  { file: 'report_2.jpg', expected: 'report' },
+  { file: 'other_1.jpg', expected: 'other' },
+  { file: 'other_2.jpg', expected: 'other' }
+]
+
+const MODEL_FILENAME = 'mobilenetv3_3class_v3_fp16.gguf'
+// qvac-test-addon-mobile's metro.config.js whitelists asset extensions
+// `so, bin, model, bundle, raw, onnx`; `.gguf` is not in the list, so
+// `scripts/copy-mobile-test-assets.js` packages the weights with a
+// `.gguf.bin` suffix and the device-side lookup uses that name.
+const MOBILE_MODEL_FILENAME = MODEL_FILENAME + '.bin'
+
+// Removes a leading `file://` scheme only: `file:///abs/path` becomes
+// `/abs/path`, and strings without the prefix pass through unchanged.
+function _stripFileUrlPrefix (mapped) {
+  return mapped.replace(/^file:\/\//, '')
+}
+
+function _resolveMobileAsset (filename) {
+  if (!isMobile || typeof global === 'undefined' || !global.assetPaths) {
+    return null
+  }
+  const candidates = [
+    `../../testAssets/${filename}`,
+    `../mobile/testAssets/${filename}`,
+    `testAssets/${filename}`,
+    `../testAssets/${filename}`
+  ]
+  for (const key of candidates) {
+    const mapped = global.assetPaths[key]
+    if (mapped) return _stripFileUrlPrefix(mapped)
+  }
+  return null
+}
+
+/**
+ * Desktop: first existing candidate, else `undefined` (constructor then
+ * uses its bundled default). Mobile: throws synchronously when the asset
+ * is missing — a rejected promise during load() aborts the bare worklet.
+ */
+function resolveModelPath () {
+  if (isMobile) {
+    const resolved = _resolveMobileAsset(MOBILE_MODEL_FILENAME)
+    if (resolved) return resolved
+    throw new Error(
+      `Mobile asset not found in global.assetPaths: ${MOBILE_MODEL_FILENAME}. ` +
+      "Did 'npm run mobile:copy-prebuilds' run during test setup, " +
+      'and is `test/mobile/testAssets/' + MOBILE_MODEL_FILENAME + '` present?'
+    )
+  }
+
+  const desktopCandidates = [
+    path.resolve(__dirname, '..', 'mobile', 'testAssets', MODEL_FILENAME),
+    path.resolve(__dirname, '..', 'mobile', 'testAssets', MOBILE_MODEL_FILENAME),
+    path.resolve(__dirname, '..', '..', 'weights', MODEL_FILENAME)
+  ]
+  for (const candidate of desktopCandidates) { // checked in order; first hit wins
+    if (fs.existsSync(candidate)) return candidate
+  }
+  return undefined
+}
+
+// Mobile: throw synchronously on miss for the same reason as
+// resolveModelPath() — see comment above.
+function _resolveImagePath (name) {
+  if (isMobile) {
+    const resolved = _resolveMobileAsset(name)
+    if (resolved) return resolved
+    const known = (typeof global !== 'undefined' && global.assetPaths)
+      ? Object.keys(global.assetPaths).slice(0, 8).join(', ')
+      : '(no global.assetPaths)'
+    throw new Error(
+      `Mobile test image not found in global.assetPaths: ${name}. ` +
+      "Did 'npm run mobile:copy-prebuilds' run during test setup, " +
+      'and is `test/mobile/testAssets/' + name + '` present? ' +
+      `assetPaths sample keys: [${known}]`
+    )
+  }
+  return path.join(IMAGE_DIR, name)
+}
+
+function loadImage (name) {
+  return fs.readFileSync(_resolveImagePath(name))
+}
+
+function makeClassifier (overrides) {
+  const opts = {
+    modelPath: resolveModelPath(),
+    logger: createLogger()
+  }
+  if (overrides) Object.assign(opts, overrides)
+  return new ImageClassifier(opts)
+}
+
+// Errors swallowed so a failing teardown can't mask the assertion
+// that triggered it.
+async function cleanupClassifier (classifier) {
+  if (!classifier) return
+  try {
+    await classifier.unload()
+  } catch (_) {}
+}
+
+function recordMetric (label, totalTimeMs, input) {
+  _perfReporter.record(label, {
+    total_time_ms: Math.round(totalTimeMs)
+  }, {
+    input: input || null
+  })
+  _installExitHook()
+  _flushReport()
+}
+
+function recordLoadTime (label, loadTimeMs) {
+  _perfReporter.record(label, {
+    total_time_ms: Math.round(loadTimeMs)
+  }, {
+    input: 'load'
+  })
+  _installExitHook()
+  _flushReport()
+}
+
+module.exports = {
+  platform,
+  isMobile,
+  TEST_TIMEOUT,
+  IMAGE_SAMPLES,
+  IMAGE_DIR,
+  MODEL_FILENAME,
+  loadImage,
+  createLogger,
+  recordMetric,
+  recordLoadTime,
+  resolveModelPath,
+  makeClassifier,
+  cleanupClassifier
+}
diff --git a/packages/classification-ggml/test/mobile/README.md b/packages/classification-ggml/test/mobile/README.md
new file mode 100644
index 0000000000..932161aa27
--- /dev/null
+++ b/packages/classification-ggml/test/mobile/README.md
@@ -0,0 +1,44 @@
+# Mobile tests
+
+Mobile-specific test infrastructure for `@qvac/classification-ggml`. Runs
+the same integration suite as desktop (`test/integration/*.test.js`) on
+Android and iOS devices via the shared `qvac-test-addon-mobile`
+framework.
+
+## Structure
+
+- `integration-runtime.cjs` — loaded by the mobile framework at boot.
+  Exposes `global.runIntegrationModule(relPath, options)`, which
+  imports one integration module, triggers a GC pass, and sleeps for
+  a short cooldown before returning.
+- `integration.auto.cjs` — **auto-generated** wrapper file. Contains
+  one `async function runXxx(options)` per `*.test.js` file under
+  `test/integration/`. **Do not edit manually.** Re-generate with
+  `npm run test:mobile:generate`.
+- `testAssets/` — device-side assets, filled at build/test time by
+  `scripts/copy-mobile-test-assets.js` (FP16 GGUF weights renamed to
+  `*.gguf.bin`, plus the `test/images/` fixtures); never committed.
+
+## Regenerating
+
+```bash
+npm run test:mobile:generate   # bare ./scripts/generate-mobile-integration-tests.js
+npm run test:mobile:validate   # node ./scripts/validate-mobile-tests.js
+```
+
+## What ships in npm
+
+The package publishes `test/mobile/` **and** `test/integration/` (see
+the `files` field in `package.json`) so the mobile framework can
+resolve the `../integration/*.test.js` imports from the installed npm
+tree. The GGUF model is bundled under `weights/`; on-device tests load
+the `testAssets/` copy (`*.gguf.bin`) resolved through `global.assetPaths`.
+
+## Lifecycle caveat on mobile
+
+The underlying `@qvac/qvac-lib-inference-addon-cpp` `JsLogger` holds a
+process-wide static `uv_async_t` whose lifecycle is not safe across
+rapid classifier create/destroy cycles. The `ImageClassifier`
+`nativeLogger` option is therefore **off by default** on all platforms,
+including mobile. JS-level logging still flows through the caller's
+`logger`.
diff --git a/packages/classification-ggml/test/mobile/integration-runtime.cjs b/packages/classification-ggml/test/mobile/integration-runtime.cjs
new file mode 100644
index 0000000000..4819a963e5
--- /dev/null
+++ b/packages/classification-ggml/test/mobile/integration-runtime.cjs
@@ -0,0 +1,37 @@
+'use strict'
+
+// Shared mobile integration runtime. The qvac-test-addon-mobile framework
+// loads the sibling `integration.auto.cjs` on-device, which calls back
+// into `runIntegrationModule(...)` to execute one integration test module
+// at a time. Between modules we force a GC (if exposed by the runtime)
+// and sleep briefly so native resources allocated by libggml / bare-stream
+// are reclaimed before the next module begins.
+
+const path = require('bare-path')
+const fs = require('bare-fs')
+const { pathToFileURL } = require('bare-url')
+
+const GC_PAUSE_MS = 3000
+
+async function runIntegrationModule (relativeModulePath, options = {}) {
+  const modulePath = path.join(__dirname, relativeModulePath)
+
+  if (!fs.existsSync(modulePath)) {
+    console.warn(`[integration-runner] Missing module: ${relativeModulePath}`)
+    return 'missing'
+  }
+
+  const moduleUrl = pathToFileURL(modulePath).href
+  await import(moduleUrl)
+
+  if (global.gc) {
+    global.gc()
+    console.log(`[integration-runner] GC triggered after ${relativeModulePath}`)
+  }
+  await new Promise(resolve => setTimeout(resolve, options.gcPauseMs || GC_PAUSE_MS))
+  console.log(`[integration-runner] ${GC_PAUSE_MS}ms cooldown complete`)
+
+  return modulePath
+}
+
+global.runIntegrationModule = runIntegrationModule
diff --git a/packages/classification-ggml/test/mobile/integration.auto.cjs b/packages/classification-ggml/test/mobile/integration.auto.cjs
new file mode 100644
index 0000000000..03353158ff
--- /dev/null
+++ b/packages/classification-ggml/test/mobile/integration.auto.cjs
@@ -0,0 +1,12 @@
+'use strict'
+require('./integration-runtime.cjs')
+
+/* global runIntegrationModule */
+
+async function runClassify (options = {}) { // eslint-disable-line no-unused-vars
+  return runIntegrationModule('../integration/classify.test.js', options)
+}
+
+async function runErrorCases (options = {}) { // eslint-disable-line no-unused-vars
+  return runIntegrationModule('../integration/error-cases.test.js', options)
+}
diff --git a/packages/classification-ggml/test/mobile/testAssets/.gitignore b/packages/classification-ggml/test/mobile/testAssets/.gitignore
new file mode 100644
index 0000000000..8ecee66652
--- /dev/null
+++ b/packages/classification-ggml/test/mobile/testAssets/.gitignore
@@ -0,0 +1,17 @@
+# Ignore any large model or image files placed here by ad-hoc scripts.
+# `scripts/copy-mobile-test-assets.js` populates this directory at
+# build/test time with:
+#   - the FP16 GGUF weights blob (renamed to `*.gguf.bin` so metro
+#     treats it as a binary asset rather than a JS module)
+#   - the integration test images from `test/images/*.{jpg,jpeg,png}`
+# Both kinds of files are derived artifacts and must not be committed.
+*.gguf
+*.bin
+*.safetensors
+*.ckpt
+*.jpg
+*.jpeg
+*.png
+
+# Keep this directory tracked.
+!.gitignore
diff --git a/packages/classification-ggml/test/unit/CMakeLists.txt b/packages/classification-ggml/test/unit/CMakeLists.txt
new file mode 100644
index 0000000000..55ee58a61e
--- /dev/null
+++ b/packages/classification-ggml/test/unit/CMakeLists.txt
@@ -0,0 +1,63 @@
+cmake_minimum_required(VERSION 3.25)
+
+project(ggml_classification_tests LANGUAGES C CXX)
+
+find_package(GTest CONFIG REQUIRED)
+
+option(ENABLE_COVERAGE "Enable coverage instrumentation for unit tests" OFF)
+
+set(TEST_SOURCES
+  classification_model_test.cpp
+  preprocessor_test.cpp
+  ${CMAKE_SOURCE_DIR}/addon/src/model-interface/ClassificationModel.cpp
+  ${CMAKE_SOURCE_DIR}/addon/src/model-interface/ImagePreprocessor.cpp
+  ${CMAKE_SOURCE_DIR}/addon/src/model-interface/MobileNetGraph.cpp
+)
+
+add_executable(addon-test ${TEST_SOURCES})
+target_compile_features(addon-test PRIVATE cxx_std_20)
+
+target_compile_options(addon-test PRIVATE -Wall -Wextra -Wfatal-errors -g)
+target_compile_definitions(addon-test PRIVATE GTEST_HAS_POSIX_RE=0)
+
+if(NOT WIN32)
+  target_compile_options(addon-test PRIVATE -fno-omit-frame-pointer)
+endif()
+
+target_include_directories(
+  addon-test
+  PRIVATE
+  ${CMAKE_SOURCE_DIR}/addon/src
+  ${QVAC_LIB_INFERENCE_ADDON_CPP_INCLUDE_DIRS}
+  ${STB_INCLUDE_DIRS}
+)
+
+target_link_libraries(
+  addon-test
+  PRIVATE
+    ggml::ggml
+    ggml::ggml-base
+    ggml::ggml-cpu
+    GTest::gtest
+    GTest::gtest_main
+)
+
+# Coverage: -fprofile-instr-generate/-fcoverage-mapping are Clang-only; GCC uses --coverage.
+if(ENABLE_COVERAGE AND CMAKE_CXX_COMPILER_ID MATCHES "Clang")
+  target_compile_options(addon-test PRIVATE -fprofile-instr-generate -fcoverage-mapping)
+  target_link_options(addon-test PRIVATE -fprofile-instr-generate)
+elseif(ENABLE_COVERAGE AND CMAKE_CXX_COMPILER_ID STREQUAL "GNU")
+  target_compile_options(addon-test PRIVATE --coverage)
+  target_link_options(addon-test PRIVATE --coverage)
+endif()
+
+if(WIN32)
+  target_link_libraries(addon-test PRIVATE msvcrt.lib)
+else()
+  target_link_libraries(addon-test PRIVATE -fsanitize=address)
+endif()
+
+add_test(NAME ClassificationModelTests COMMAND addon-test)
+set_tests_properties(ClassificationModelTests PROPERTIES
+  WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
+  TIMEOUT 600)
diff --git a/packages/classification-ggml/test/unit/all.js b/packages/classification-ggml/test/unit/all.js
new file mode 100644
index 0000000000..b3bd8d1021
--- /dev/null
+++ b/packages/classification-ggml/test/unit/all.js
@@ -0,0 +1,13 @@
+// This runner is auto-generated by Brittle
+
+runTests()
+
+async function runTests () {
+  const test = (await import('brittle')).default
+
+  test.pause()
+
+  await import('./map-addon-event.test.js')
+
+  test.resume()
+}
diff --git a/packages/classification-ggml/test/unit/classification_model_test.cpp b/packages/classification-ggml/test/unit/classification_model_test.cpp
new file mode 100644
index 0000000000..d32a8aa305
--- /dev/null
+++ b/packages/classification-ggml/test/unit/classification_model_test.cpp
@@ -0,0 +1,142 @@
+#include <gtest/gtest.h>
+
+#include <cstdlib>
+#include <filesystem>
+
+#include "model-interface/ClassificationModel.hpp"
+#include "model-interface/ImagePreprocessor.hpp"
+#include "model-interface/MobileNetGraph.hpp"
+
+namespace qcc = classification_ggml;
+namespace qpp = classification_ggml::preprocess;
+namespace qgraph = classification_ggml::graph;
+
+namespace {
+
+/// Resolves the FP16 weights path; returns "" when no file is found. Priority:
+/// 1. QVAC_CLASSIFICATION_MODEL_PATH env var (used by CI), if that path exists.
+/// 2. weights/ directory, searched upward from the current working directory.
+std::string findWeightsPath() {
+  const char* env = std::getenv("QVAC_CLASSIFICATION_MODEL_PATH");
+  if (env != nullptr && std::filesystem::exists(env)) {
+    return env;
+  }
+  std::filesystem::path here = std::filesystem::current_path();
+  for (int i = 0; i < 6; ++i) {  // cwd, then up to five ancestors
+    const auto candidate =
+        here / "weights" / "mobilenetv3_3class_v3_fp16.gguf";
+    if (std::filesystem::exists(candidate)) {
+      return candidate.string();
+    }
+    if (!here.has_parent_path()) break;
+    here = here.parent_path();
+  }
+  return "";
+}
+
+class ClassificationModelTest : public ::testing::Test {
+protected:
+  void SetUp() override {
+    weightsPath_ = findWeightsPath();
+    if (weightsPath_.empty()) {
+      GTEST_SKIP() << "Model weights file not found; skipping (set "
+                      "QVAC_CLASSIFICATION_MODEL_PATH to run).";
+    }
+  }
+  std::string weightsPath_;
+};
+
+} // namespace
+
+TEST(MobileNetGraphTest, ArchitectureMatches34ConvAnd2Linear) {
+  // Static architecture sanity check: 1 (stem) + Σ convs-per-block + 1 (tail) = 34
+  int totalConvs = 1 /*stem*/ + 1 /*tail*/;
+  int totalSeBlocks = 0;
+  for (const qgraph::BlockConfig& b : qgraph::kBlocks) {
+    const bool hasExpand = b.expandedChannels != b.inputChannels;
+    // expand + depthwise + project
+    totalConvs += (hasExpand ? 1 : 0) + 1 + 1;
+    if (b.useSe) ++totalSeBlocks;
+  }
+  EXPECT_EQ(totalConvs, 34);
+  EXPECT_EQ(totalSeBlocks, 9)
+      << "MobileNetV3-Small has 9 SE blocks (features 1, 4-11)";
+}
+
+TEST_F(ClassificationModelTest, LoadSucceedsAndRunsInference) {
+  qcc::ClassificationModel model(weightsPath_);
+  ASSERT_NO_THROW(model.load());
+
+  // Feed a neutral gray image; we only care that it runs and returns 3 valid
+  // probabilities, not about accuracy in this test.
+  std::vector<uint8_t> rawGray(qpp::kInputSize * qpp::kInputSize * 3, 128);
+  qcc::ClassifyInput input;
+  input.data = rawGray;
+  input.rawRgb =
+      qcc::RawRgbDims{qpp::kInputSize, qpp::kInputSize, 3};
+
+  std::any out;
+  ASSERT_NO_THROW(out = model.process(input));
+  const auto* result = std::any_cast<qcc::ClassifyOutput>(&out);
+  ASSERT_NE(result, nullptr);
+  ASSERT_EQ(result->results.size(), qgraph::kNumClasses);
+
+  float sum = 0.0F;
+  for (const qcc::ClassifyResult& r : result->results) {
+    EXPECT_GE(r.confidence, 0.0F);
+    EXPECT_LE(r.confidence, 1.0F);
+    EXPECT_FALSE(r.label.empty());
+    sum += r.confidence;
+  }
+  EXPECT_NEAR(sum, 1.0F, 1e-3F) << "softmax probabilities should sum to ~1.0";
+  EXPECT_GE(result->results[0].confidence, result->results[1].confidence)
+      << "results must be sorted by confidence descending";
+}
+
+TEST_F(ClassificationModelTest, SequentialInferenceIsDeterministic) {
+  qcc::ClassificationModel model(weightsPath_);
+  ASSERT_NO_THROW(model.load());
+
+  std::vector<uint8_t> rawGray(qpp::kInputSize * qpp::kInputSize * 3, 128);
+  qcc::ClassifyInput input;
+  input.data = rawGray;
+  input.rawRgb =
+      qcc::RawRgbDims{qpp::kInputSize, qpp::kInputSize, 3};
+
+  std::any a = model.process(input);
+  std::any b = model.process(input);
+  const auto* ra = std::any_cast<qcc::ClassifyOutput>(&a);
+  const auto* rb = std::any_cast<qcc::ClassifyOutput>(&b);
+  ASSERT_NE(ra, nullptr);
+  ASSERT_NE(rb, nullptr);
+  ASSERT_EQ(ra->results.size(), rb->results.size());
+  for (size_t i = 0; i < ra->results.size(); ++i) {
+    EXPECT_EQ(ra->results[i].label, rb->results[i].label);
+    EXPECT_NEAR(ra->results[i].confidence, rb->results[i].confidence, 1e-6F);
+  }
+}
+
+TEST_F(ClassificationModelTest, TopKFiltersResults) {
+  qcc::ClassificationModel model(weightsPath_);
+  ASSERT_NO_THROW(model.load());
+
+  std::vector<uint8_t> rawGray(qpp::kInputSize * qpp::kInputSize * 3, 128);
+  qcc::ClassifyInput input;
+  input.data = rawGray;
+  input.rawRgb =
+      qcc::RawRgbDims{qpp::kInputSize, qpp::kInputSize, 3};
+  input.topK = 1;
+
+  std::any out = model.process(input);
+  const auto* res = std::any_cast<qcc::ClassifyOutput>(&out);
+  ASSERT_NE(res, nullptr);
+  EXPECT_EQ(res->results.size(), 1U);
+}
+
+TEST(BatchNormFoldingTest, EpsilonIsZeroPointZeroZeroOne) {
+  // The spec fixes BN epsilon at 0.001 (architecture-specific, matches the
+  // original MobileNetV3 paper and the torchvision `mobilenet_v3_small`
+  // default). Guards against a regression to the generic 1e-5 that causes
+  // normalisation drift to accumulate across all 34 layers of the network.
+  EXPECT_FLOAT_EQ(qgraph::kBatchNormEpsilon, 0.001F);
+}
diff --git a/packages/classification-ggml/test/unit/map-addon-event.test.js b/packages/classification-ggml/test/unit/map-addon-event.test.js
new file mode 100644
index 0000000000..e7b0ad452a
--- /dev/null
+++ b/packages/classification-ggml/test/unit/map-addon-event.test.js
@@ -0,0 +1,81 @@
+'use strict'
+
+const test = require('brittle')
+const { mapAddonEvent } = require('../../addon.js')
+
+test('Array payload maps to Output regardless of event name', function (t) {
+  const data = [{ label: 'food', confidence: 0.9 }]
+  const result = mapAddonEvent('struct ...::ClassifyOutput', data, null)
+  t.is(result.type, 'Output')
+  t.is(result.data, data)
+  t.is(result.error, null)
+})
+
+test('Plain non-array object maps to terminal JobEnded', function (t) {
+  // Models the upstream JobRunner's stats trailer, whose RTTI event name
+  // is the raw `std::vector<std::pair<...>>` — there is no literal
+  // `JobEnded` substring in the event for this addon.
+  const stats = { total_time_ms: 47.3 }
+  const result = mapAddonEvent('class std::vector<std::pair<...>>', stats, null)
+  t.is(result.type, 'JobEnded', 'shape-keyed: object → terminal')
+  t.is(result.data, stats)
+  t.is(result.error, null)
+})
+
+test('Event name containing "Error" maps to Error with rawError', function (t) {
+  const err = new Error('boom')
+  const result = mapAddonEvent('class qvac_errors::SomeError', null, err)
+  t.is(result.type, 'Error')
+  t.is(result.data, null)
+  t.is(result.error, err)
+})
+
+test('Event name containing "LogMsg" maps to LogMsg (not Output) for string data', function (t) {
+  const result = mapAddonEvent('class JsLogMsgOutputHandler', 'native log line', null)
+  t.is(result.type, 'LogMsg', 'name-match wins over the Array fallback')
+  t.is(result.data, 'native log line')
+  t.is(result.error, null)
+})
+
+test('Event name containing "JobStarted" returns null (drop)', function (t) {
+  const result = mapAddonEvent('struct ...::JobStarted', null, null)
+  t.is(result, null)
+})
+
+test('Event name containing "JobEnded" maps to JobEnded (defensive name path)', function (t) {
+  const result = mapAddonEvent('struct ...::JobEnded', { ok: true }, null)
+  t.is(result.type, 'JobEnded')
+  t.alike(result.data, { ok: true })
+})
+
+test('Unknown event with primitive data falls through preserving event name', function (t) {
+  const result = mapAddonEvent('UnknownEvent', 42, null)
+  t.is(result.type, 'UnknownEvent')
+  t.is(result.data, 42)
+  t.is(result.error, null)
+})
+
+test('Unknown event with null data falls through preserving event name', function (t) {
+  const result = mapAddonEvent('UnknownEvent', null, null)
+  t.is(result.type, 'UnknownEvent')
+  t.is(result.data, null)
+})
+
+test('Non-string event with array data still maps to Output', function (t) {
+  // Defensive: even if upstream ever emits a non-string event marker,
+  // payload-shape keying keeps us safe for arrays.
+  const result = mapAddonEvent(undefined, [1, 2, 3], null)
+  t.is(result.type, 'Output')
+  t.alike(result.data, [1, 2, 3])
+})
+
+test('Object data with a nested results array still routes to JobEnded (regression guard)', function (t) {
+  // If a future C++ change wraps ClassifyOutput in `{ results: [...] }`,
+  // this branch silently misclassifies it as JobEnded. The integration
+  // suite would notice via classify() resolving to undefined; this unit
+  // test pins down the current shape-keyed behaviour so the regression
+  // is caught at the unit level, not at integration time.
+  const result = mapAddonEvent('struct ...::SomeWrappedOutput', { results: [{ label: 'x', confidence: 1 }] }, null)
+  t.is(result.type, 'JobEnded', 'TODAY: object data wins over inner array; revisit if upstream wraps Output in an object')
+  t.alike(result.data.results, [{ label: 'x', confidence: 1 }])
+})
diff --git a/packages/classification-ggml/test/unit/preprocessor_test.cpp b/packages/classification-ggml/test/unit/preprocessor_test.cpp
new file mode 100644
index 0000000000..9021d02a91
--- /dev/null
+++ b/packages/classification-ggml/test/unit/preprocessor_test.cpp
@@ -0,0 +1,250 @@
+#include <gtest/gtest.h>
+
+#include <array>
+#include <cmath>
+#include <cstdint>
+#include <cstdio>
+#include <filesystem>
+#include <fstream>
+#include <string>
+#include <vector>
+
+#include "model-interface/ImagePreprocessor.hpp"
+
+using namespace classification_ggml::preprocess;
+
+namespace {
+
+// Looks for test/images/<name> in the current working directory and up to
+// five ancestors. Returns the file's bytes, or an empty vector when the
+// image is missing or cannot be read in full (callers skip on empty).
+std::vector<uint8_t> readTestImage(const std::string& name) {
+  std::filesystem::path here = std::filesystem::current_path();
+  for (int i = 0; i < 6; ++i) {
+    const auto candidate = here / "test" / "images" / name;
+    if (std::filesystem::exists(candidate)) {
+      std::ifstream f(candidate, std::ios::binary | std::ios::ate);
+      const std::streamsize size = f.tellg(); // -1 if the open failed
+      if (size <= 0) return {};
+      std::vector<uint8_t> buf(static_cast<size_t>(size));
+      f.seekg(0).read(reinterpret_cast<char*>(buf.data()), size);
+      if (!f) return {}; // short or failed read: do not hand back partial data
+      return buf;
+    }
+    if (!here.has_relative_path()) break; // at the root; nothing above it
+    here = here.parent_path();
+  }
+  return {};
+}
+
+} // namespace
+
+TEST(PreprocessorTest, MagicBytesDetectJpeg) {
+  const std::array<uint8_t, 4> header{0xFF, 0xD8, 0xFF, 0xE0}; // SOI + APP0
+  EXPECT_TRUE(isEncodedImage({header.data(), header.size()}));
+}
+
+TEST(PreprocessorTest, MagicBytesDetectPng) {
+  const std::array<uint8_t, 8> signature{
+      0x89, 0x50, 0x4E, 0x47, 0x0D, 0x0A, 0x1A, 0x0A}; // full PNG signature
+  EXPECT_TRUE(isEncodedImage({signature.data(), signature.size()}));
+}
+
+TEST(PreprocessorTest, MagicBytesRejectBmp) {
+  const std::array<uint8_t, 4> header{0x42, 0x4D, 0x00, 0x00}; // starts "BM"
+  EXPECT_FALSE(isEncodedImage({header.data(), header.size()}));
+}
+
+TEST(PreprocessorTest, ValidateRawRgbChecksChannelCount) {
+  std::vector<uint8_t> rgba(4 * 4 * 4); // zero-filled, sized for 4 channels
+  EXPECT_THROW(validateRawRgb(rgba, 4, 4, 4), std::exception);
+}
+
+TEST(PreprocessorTest, ValidateRawRgbChecksBufferSize) {
+  std::vector<uint8_t> tooSmall(5); // a 4x4 image at 3 channels is 48 bytes
+  EXPECT_THROW(validateRawRgb(tooSmall, 4, 4, 3), std::exception);
+}
+
+TEST(PreprocessorTest, ValidateRawRgbAccepts3Channels) {
+  std::vector<uint8_t> rgb(4 * 4 * 3); // zero-filled, exactly 4x4x3 bytes
+  EXPECT_NO_THROW(validateRawRgb(rgb, 4, 4, 3));
+}
+
+TEST(PreprocessorTest, EmptyBufferIsRejected) {
+  std::vector<uint8_t> noBytes{}; // no data and no declared dimensions
+  EXPECT_THROW(preprocessToTensor(noBytes, 0, 0, 0), std::exception);
+}
+
+TEST(PreprocessorTest, NormalizeToWhcnProducesExpectedSize) {
+  const size_t expected =
+      static_cast<size_t>(kInputSize) * kInputSize * kChannels;
+  std::vector<uint8_t> gray(kInputSize * kInputSize * kChannels, 128);
+  const std::vector<float> tensor = normalizeToWhcn(gray);
+  EXPECT_EQ(tensor.size(), expected);
+  // A mid-gray input (128/255, roughly 0.502) run through the ImageNet
+  // mean/std normalization has to land well inside (-3, 3) on every channel.
+  for (const float value : tensor) {
+    EXPECT_GT(value, -3.0F);
+    EXPECT_LT(value, 3.0F);
+  }
+}
+
+TEST(PreprocessorTest, ResizeProducesExpectedDimensions) {
+  std::vector<uint8_t> tiny(10 * 10 * 3, 200); // uniform 10x10 RGB source
+  const std::vector<uint8_t> scaled = resizeToInput(tiny, 10, 10);
+  EXPECT_EQ(scaled.size(),
+            static_cast<size_t>(kInputSize) * kInputSize * kChannels);
+}
+
+TEST(PreprocessorTest, NormalizeToWhcnChannelFirstLayout) {
+  // Pure-red input. out[1] is the discriminating probe: it is an R value in
+  // planar (channel-first) output but a G value in interleaved output.
+  const size_t plane = static_cast<size_t>(kInputSize) * kInputSize;
+  std::vector<uint8_t> rgb(plane * kChannels, 0);
+  for (size_t i = 0; i < plane; ++i) {
+    rgb[i * kChannels] = 255; // R
+  }
+  const std::vector<float> out = normalizeToWhcn(rgb);
+  ASSERT_EQ(out.size(), plane * kChannels); // guards the indexed reads below
+  EXPECT_NEAR(out[0], (1.0F - kImageNetMean[0]) / kImageNetStd[0], 1e-3F);
+  EXPECT_NEAR(out[1], (1.0F - kImageNetMean[0]) / kImageNetStd[0], 1e-3F);
+  EXPECT_NEAR(out[plane], (0.0F - kImageNetMean[1]) / kImageNetStd[1], 1e-3F);
+  EXPECT_NEAR(out[2 * plane], (0.0F - kImageNetMean[2]) / kImageNetStd[2], 1e-3F);
+}
+
+// -------- decodeToRgb coverage --------
+
+TEST(PreprocessorTest, DecodeToRgbDecodesValidJpeg) {
+  std::vector<uint8_t> encoded = readTestImage("meal_1.jpg");
+  if (encoded.empty()) {
+    GTEST_SKIP() << "test/images/meal_1.jpg not found; skipping.";
+  }
+  // decodeToRgb reports the decoded dimensions through these out-params.
+  uint32_t w = 0;
+  uint32_t h = 0;
+  const std::vector<uint8_t> pixels = decodeToRgb(encoded, w, h);
+  EXPECT_GT(w, 0u);
+  EXPECT_GT(h, 0u);
+  EXPECT_LE(w, kMaxImageDimension);
+  EXPECT_LE(h, kMaxImageDimension);
+  // The byte count has to equal width * height * kChannels.
+  EXPECT_EQ(pixels.size(), static_cast<size_t>(w) * h * kChannels);
+}
+
+TEST(PreprocessorTest, DecodeToRgbRejectsEmptyBuffer) {
+  std::vector<uint8_t> noBytes{}; // nothing to decode
+  uint32_t width = 0;
+  uint32_t height = 0;
+  EXPECT_THROW(decodeToRgb(noBytes, width, height), std::exception);
+}
+
+TEST(PreprocessorTest, DecodeToRgbRejectsCorruptedBytes) {
+  // Sixteen sequential bytes (0x01..0x10); they do not parse as any image
+  // format, so decoding has to fail.
+  std::vector<uint8_t> junk{0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08,
+                            0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F, 0x10};
+  uint32_t width = 0;
+  uint32_t height = 0;
+  EXPECT_THROW(decodeToRgb(junk, width, height), std::exception);
+}
+
+TEST(PreprocessorTest, DecodeToRgbRejectsTruncatedJpeg) {
+  std::vector<uint8_t> truncated = readTestImage("meal_1.jpg");
+  if (truncated.empty()) {
+    GTEST_SKIP() << "test/images/meal_1.jpg not found; skipping.";
+  }
+  // Keep only the first 8 bytes (SOI plus a few header bytes). The decoder
+  // (stbi) has to throw on such a stream instead of quietly returning a
+  // partial image.
+  truncated.resize(8);
+  uint32_t width = 0;
+  uint32_t height = 0;
+  EXPECT_THROW(decodeToRgb(truncated, width, height), std::exception);
+}
+
+// -------- preprocessToTensor full-pipeline coverage --------
+
+TEST(PreprocessorTest, PreprocessToTensorAcceptsEncodedJpeg) {
+  std::vector<uint8_t> encoded = readTestImage("meal_1.jpg");
+  if (encoded.empty()) {
+    GTEST_SKIP() << "test/images/meal_1.jpg not found; skipping.";
+  }
+  // Encoded input: width, height and channels are all passed as 0.
+  const std::vector<float> tensor = preprocessToTensor(encoded, 0, 0, 0);
+  const size_t want = static_cast<size_t>(kInputSize) * kInputSize * kChannels;
+  EXPECT_EQ(tensor.size(), want);
+  for (const float value : tensor) {
+    EXPECT_TRUE(std::isfinite(value));
+  }
+}
+
+TEST(PreprocessorTest, PreprocessToTensorAcceptsRawRgb) {
+  // Raw path: 16x16 RGB block, every byte 64, with explicit dimensions.
+  constexpr uint32_t kSide = 16;
+  const size_t rawBytes = static_cast<size_t>(kSide) * kSide * kChannels;
+  std::vector<uint8_t> pixels(rawBytes, 64);
+  const std::vector<float> tensor =
+      preprocessToTensor(pixels, kSide, kSide, kChannels);
+  const size_t want = static_cast<size_t>(kInputSize) * kInputSize * kChannels;
+  EXPECT_EQ(tensor.size(), want);
+  for (const float value : tensor) {
+    EXPECT_TRUE(std::isfinite(value));
+  }
+}
+
+TEST(PreprocessorTest, PreprocessToTensorRejectsBmpWithoutDimensions) {
+  // "BM" magic followed by padding, passed without declared dimensions so
+  // it is handled as encoded input; BMP is not a supported encoded format,
+  // so the call has to throw.
+  std::vector<uint8_t> bmpHeader{0x42, 0x4D, 0x46, 0x00, 0x00,
+                                 0x00, 0x00, 0x00, 0x00, 0x00};
+  EXPECT_THROW(preprocessToTensor(bmpHeader, 0, 0, 0), std::exception);
+}
+
+TEST(PreprocessorTest, PreprocessToTensorRejectsRawWithMissingDims) {
+  // The buffer has the size of a 4x4 RGB image, yet width/height/channels
+  // are all 0; the raw path needs them declared, so the call has to throw.
+  std::vector<uint8_t> undeclared(4 * 4 * 3);
+  EXPECT_THROW(preprocessToTensor(undeclared, 0, 0, 0), std::exception);
+}
+
+// -------- validateRawRgb edge cases --------
+
+TEST(PreprocessorTest, ValidateRawRgbRejectsEmptyBuffer) {
+  std::vector<uint8_t> noBytes{}; // zero bytes against a declared 4x4x3
+  EXPECT_THROW(validateRawRgb(noBytes, 4, 4, 3), std::exception);
+}
+
+TEST(PreprocessorTest, ValidateRawRgbRejectsZeroWidth) {
+  std::vector<uint8_t> pixels(4 * 3); // non-empty, zero-filled
+  EXPECT_THROW(validateRawRgb(pixels, 0, 4, 3), std::exception);
+}
+
+TEST(PreprocessorTest, ValidateRawRgbRejectsZeroHeight) {
+  std::vector<uint8_t> pixels(4 * 3); // non-empty, zero-filled
+  EXPECT_THROW(validateRawRgb(pixels, 4, 0, 3), std::exception);
+}
+
+TEST(PreprocessorTest, ValidateRawRgbRejectsOverKMaxImageDimensionWidth) {
+  // The buffer is exactly (kMaxImageDimension + 1) x 1 x 3 bytes, so a
+  // buffer-size mismatch cannot be the reason the call throws; with a
+  // too-small buffer this test would pass even without a dimension limit.
+  std::vector<uint8_t> buf((size_t{1} + kMaxImageDimension) * 3, 0);
+  EXPECT_THROW(
+      validateRawRgb(buf, kMaxImageDimension + 1, 1, 3), std::exception);
+}
+
+TEST(PreprocessorTest, ValidateRawRgbRejectsOverKMaxImageDimensionHeight) {
+  // Exact-size buffer, so a size mismatch cannot be why the call throws.
+  std::vector<uint8_t> buf((size_t{1} + kMaxImageDimension) * 3, 0);
+  EXPECT_THROW(validateRawRgb(buf, 1, kMaxImageDimension + 1, 3), std::exception);
+}
+
+// -------- normalizeToWhcn invalid input size --------
+
+TEST(PreprocessorTest, NormalizeToWhcnRejectsWrongInputSize) {
+  // The input is one byte short of the expected kInputSize^2 * kChannels.
+  const size_t full = static_cast<size_t>(kInputSize) * kInputSize * kChannels;
+  std::vector<uint8_t> shortBuf(full - 1);
+  EXPECT_THROW(normalizeToWhcn(shortBuf), std::exception);
+}
diff --git a/packages/classification-ggml/tsconfig.dts.json b/packages/classification-ggml/tsconfig.dts.json
new file mode 100644
index 0000000000..fbc1764f1c
--- /dev/null
+++ b/packages/classification-ggml/tsconfig.dts.json
@@ -0,0 +1,15 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "commonjs",
+    "moduleResolution": "node",
+    "strict": true,
+    "noEmit": true,
+    "skipLibCheck": true,
+    "esModuleInterop": true,
+    "forceConsistentCasingInFileNames": true
+  },
+  "include": [
+    "index.d.ts"
+  ]
+}
diff --git a/packages/classification-ggml/vcpkg-configuration.json b/packages/classification-ggml/vcpkg-configuration.json
new file mode 100644
index 0000000000..5fe2b9f2a8
--- /dev/null
+++ b/packages/classification-ggml/vcpkg-configuration.json
@@ -0,0 +1,18 @@
+{
+  "default-registry": {
+    "kind": "git",
+    "baseline": "803c0d119ea002694963e89237c207ff6ecf47f6",
+    "repository": "https://github.com/tetherto/qvac-registry-vcpkg.git"
+  },
+  "registries": [
+    {
+      "kind": "git",
+      "baseline": "16c71a39e5a0fc0bdb3fad03beef8f38ee00ee3b",
+      "repository": "https://github.com/microsoft/vcpkg",
+      "packages": [
+        "gtest",
+        "stb"
+      ]
+    }
+  ]
+}
diff --git a/packages/classification-ggml/vcpkg.json b/packages/classification-ggml/vcpkg.json
new file mode 100644
index 0000000000..5f81786e1f
--- /dev/null
+++ b/packages/classification-ggml/vcpkg.json
@@ -0,0 +1,26 @@
+{
+  "dependencies": [
+    {
+      "name": "qvac-fabric",
+      "version>=": "8189.0.2",
+      "default-features": false
+    },
+    {
+      "name": "qvac-lib-inference-addon-cpp",
+      "version>=": "1.1.7#1"
+    },
+    {
+      "name": "qvac-lint-cpp",
+      "version>=": "1.4.4#3"
+    },
+    "stb"
+  ],
+  "features": {
+    "tests": {
+      "description": "Build tests",
+      "dependencies": [
+        "gtest"
+      ]
+    }
+  }
+}
diff --git a/packages/classification-ggml/vcpkg/toolchains/linux-clang.cmake b/packages/classification-ggml/vcpkg/toolchains/linux-clang.cmake
new file mode 100644
index 0000000000..f06d219a74
--- /dev/null
+++ b/packages/classification-ggml/vcpkg/toolchains/linux-clang.cmake
@@ -0,0 +1,4 @@
+set(CMAKE_CXX_COMPILER clang++) # C++ sources are compiled with clang++
+set(CMAKE_C_COMPILER clang) # C sources are compiled with clang
+# Continue with the linux toolchain script from the vcpkg checkout.
+include("$ENV{VCPKG_ROOT}/scripts/toolchains/linux.cmake")
diff --git a/packages/classification-ggml/vcpkg/triplets/arm64-linux.cmake b/packages/classification-ggml/vcpkg/triplets/arm64-linux.cmake
new file mode 100644
index 0000000000..77c0e6b318
--- /dev/null
+++ b/packages/classification-ggml/vcpkg/triplets/arm64-linux.cmake
@@ -0,0 +1,9 @@
+# Target: arm64 Linux, ports built as static libraries.
+set(VCPKG_CMAKE_SYSTEM_NAME Linux)
+set(VCPKG_TARGET_ARCHITECTURE arm64)
+set(VCPKG_LIBRARY_LINKAGE static)
+set(VCPKG_CRT_LINKAGE dynamic)
+set(VCPKG_CHAINLOAD_TOOLCHAIN_FILE "${CMAKE_CURRENT_LIST_DIR}/../toolchains/linux-clang.cmake")
+set(VCPKG_CXX_FLAGS "-fPIC -stdlib=libc++") # C++ is built against libc++
+set(VCPKG_C_FLAGS "-fPIC")
+set(VCPKG_LINKER_FLAGS "-stdlib=libc++")
diff --git a/packages/classification-ggml/vcpkg/triplets/x64-linux.cmake b/packages/classification-ggml/vcpkg/triplets/x64-linux.cmake
new file mode 100644
index 0000000000..7660720b49
--- /dev/null
+++ b/packages/classification-ggml/vcpkg/triplets/x64-linux.cmake
@@ -0,0 +1,9 @@
+# Target: x64 Linux, ports built as static libraries.
+set(VCPKG_CMAKE_SYSTEM_NAME Linux)
+set(VCPKG_TARGET_ARCHITECTURE x64)
+set(VCPKG_LIBRARY_LINKAGE static)
+set(VCPKG_CRT_LINKAGE dynamic)
+set(VCPKG_CHAINLOAD_TOOLCHAIN_FILE "${CMAKE_CURRENT_LIST_DIR}/../toolchains/linux-clang.cmake")
+set(VCPKG_CXX_FLAGS "-fPIC -stdlib=libc++") # C++ is built against libc++
+set(VCPKG_C_FLAGS "-fPIC")
+set(VCPKG_LINKER_FLAGS "-stdlib=libc++")
diff --git a/packages/classification-ggml/weights/mobilenetv3_3class_v3_fp16.gguf b/packages/classification-ggml/weights/mobilenetv3_3class_v3_fp16.gguf
new file mode 100644
index 0000000000..671a3b3be1
Binary files /dev/null and b/packages/classification-ggml/weights/mobilenetv3_3class_v3_fp16.gguf differ