Unsupported model type: whisper and CORS error #314

Closed
rojitdhakal opened this issue Sep 18, 2023 · 30 comments · Fixed by #545
Labels: bug (Something isn't working)

rojitdhakal commented Sep 18, 2023

const transcribe = async (
    audio,
    model,
    multilingual,
    quantized,
    subtask,
    language,
) => {
    // TODO use subtask and language

    // If multilingual is true, leave the model name unchanged; otherwise
    // append ".en" to select the English-only variant of the model.
    const modelName = `Xenova/whisper-${model}${multilingual ? "" : ".en"}`;
    console.log("modelName", modelName);

    const p = AutomaticSpeechRecognitionPipelineFactory;

    // Check if the current model settings are different from the new settings
    if (p.model !== modelName || p.quantized !== quantized) {
        // Invalidate model if different
        // Update the model name and quantized status
        p.model = modelName;
        p.quantized = quantized;

        // Check if there is an existing instance of the ASR pipeline
        if (p.instance !== null) {
            // Dispose of the existing instance (clean up resources)
            (await p.getInstance()).dispose();

            // Set the instance to null (indicating it needs to be recreated)
            p.instance = null;
        }
    }

    // Load transcriber model
    let transcriber = await p.getInstance((data) => {
        self.postMessage(data);
    });

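    // time_precision = seconds of audio represented by each model output
    // position (for Whisper, typically 30s chunks / 1500 positions = 0.02s).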
    const time_precision =
        transcriber.processor.feature_extractor.config.chunk_length /
        transcriber.model.config.max_source_positions;

    // Storage for chunks to be processed. Initialise with an empty chunk.
    let chunks_to_process = [
        {
            tokens: [],
            finalised: false,
        },
    ];

    // TODO: Storage for fully-processed and merged chunks
    // let decoded_chunks = [];

    function chunk_callback(chunk) {
        let last = chunks_to_process[chunks_to_process.length - 1];

        // Overwrite last chunk with new info
        Object.assign(last, chunk);
        last.finalised = true;

        // Create an empty chunk after, if it is not the last chunk
        if (!chunk.is_last) {
            chunks_to_process.push({
                tokens: [],
                finalised: false,
            });
        }
    }

    // Inject custom callback function to handle merging of chunks
    function callback_function(item) {
        let last = chunks_to_process[chunks_to_process.length - 1];

        // Update tokens of last chunk
        last.tokens = [...item[0].output_token_ids];

        // Merge text chunks
        // TODO optimise so we don't have to decode all chunks every time
        let data = transcriber.tokenizer._decode_asr(chunks_to_process, {
            time_precision: time_precision,
            return_timestamps: true,
            force_full_sequences: false,
        });

        self.postMessage({
            status: "update",
            task: "automatic-speech-recognition",
            data: data,
        });
    }

    // Actually run transcription
    let output = await transcriber(audio, {
        // Greedy
        top_k: 0,
        do_sample: false,

        // Sliding window
        chunk_length_s: 30,
        stride_length_s: 5,

        // Language and task
        language: language,
        task: subtask,

        // Return timestamps
        return_timestamps: true,
        force_full_sequences: false,

        // Callback functions
        callback_function: callback_function, // after each generation step
        chunk_callback: chunk_callback, // after each chunk is processed
    }).catch((error) => {
        
        self.postMessage({
            status: "error",
            task: "automatic-speech-recognition",
            data: error,
        });
        return null;
    });

    return output;
};       
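For reference, this function is written to run inside a Web Worker (hence self.postMessage). Here is a minimal sketch of how the worker side might invoke it; the message shape is an assumption for illustration, not necessarily the app's exact protocol:

self.addEventListener("message", async (event) => {
    const message = event.data;

    // Run transcription; progress updates are posted from inside transcribe()
    const transcript = await transcribe(
        message.audio,
        message.model,
        message.multilingual,
        message.quantized,
        message.subtask,
        message.language,
    );
    if (transcript === null) return;

    // Send the final result back to the main thread
    self.postMessage({
        status: "complete",
        task: "automatic-speech-recognition",
        data: transcript,
    });
});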
rojitdhakal added the bug (Something isn't working) label on Sep 18, 2023
rojitdhakal (Author) commented Sep 18, 2023

  static async getInstance(progress_callback = null) {
        if (this.instance === null) {
            // Lazily create the pipeline. Note that this stores the pending
            // Promise itself, so a rejected load stays cached here until the
            // factory resets this.instance.
            this.instance = pipeline(this.task, this.model, {
                quantized: this.quantized,
                progress_callback,
            });
        }
        console.log("inside", this.instance);
        return this.instance;
    }

When logging this.instance to the console, it shows:

Promise {<pending>}
  [[PromiseState]]: "rejected"
  [[PromiseResult]]: Error: Unsupported model type: whisper
      at AutoModelForCTC.from_pretrained (webpack-internal:///./node_modules/.pnpm/@xenova+transformers@2.6.0/node_modules/@xenova/transformers/src/models.js:3550:19)
      at async eval (webpack-internal:///./node_modules/.pnpm/@xenova+transformers@2.6.0/node_modules/@xenova/transformers/src/pipelines.js:2087:33)

rojitdhakal changed the title from "Unsupported model type: whisper" to "Unsupported model type: whisper and CORS error" on Sep 18, 2023
xenova (Collaborator) commented Sep 18, 2023

Hi there. I believe this is due to an issue we just fixed in v2.6.1 (related to minification). Could you please upgrade to v2.6.1 and try again? Thanks!
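For example, with pnpm (which the stack trace above suggests this project uses):

pnpm add @xenova/transformers@2.6.1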

rojitdhakal (Author) commented
I just upgraded to v2.6.1, but the same error persists.

rojitdhakal (Author) commented

[screenshot]

rojitdhakal (Author) commented

[screenshot]

xenova (Collaborator) commented Sep 19, 2023

Could you please post information about your environment, e.g., OS, browser, build tools?

I am aware of a similar issue for users of create-react-app; if that is the case, please switch to a more up-to-date build tool like Vite.
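For reference, a new Vite project can be scaffolded like this (standard Vite commands; the app name is a placeholder):

npm create vite@latest my-app -- --template react
cd my-app
npm install
npm run dev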

rojitdhakal (Author) commented
OS: Windows 11
Browser: Chrome-117.0.5938.89
build tools: create-next-app

xenova (Collaborator) commented Sep 19, 2023

build tools: create-next-app

Please try using Vite for your project. CRA has been removed from the React documentation. See here for more information.

rojitdhakal (Author) commented Sep 19, 2023

We are using Next.js. Vite is not an option for a Next.js application.

xenova (Collaborator) commented Sep 19, 2023

Oh my apologies, I misread "create-next-app" as "create-react-app". Sorry about that!

Could you post any information about your build process, such as whether any minification is taking place?

rojitdhakal (Author) commented

I am facing this locally on the development server, without minification.

xenova (Collaborator) commented Sep 19, 2023

Do you perhaps have a repo where I can try to reproduce this? Or could you post your next.config.js? Thanks!

rojitdhakal (Author) commented

We are currently working in a private repo. We can share it later if required (we'd need to prepare it first), but for now here's the Next.js config:

/** @type {import('next').NextConfig} */

const nextConfig = {
  reactStrictMode: true,
  compress: false,

  images: {
    loader: "akamai",
    path: "",
  },
  compiler: {
    // Enables the styled-components SWC transform
    styledComponents: true,
  },
  // lessLoaderOptions: {
  //   lessOptions: {
  //     javascriptEnabled: true,
  //   },
  // },
  webpack(config) {
    config.module.rules.push({
      test: /\.svg$/,
      use: ["@svgr/webpack"],
    });
    return config;
  },
};

module.exports = nextConfig;

xenova (Collaborator) commented Sep 19, 2023

And which version of node / next.js / npm are you using?

rojitdhakal (Author) commented

next version: 13.4.13
node version: 16.15.0
pnpm version: 7.23.0

xenova (Collaborator) commented Sep 19, 2023

node version: 16.15.0

This might be the issue. In the docs, we recommend a minimum Node version of 18; 16.x has reached EOL. Could you try upgrading?
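For example, with nvm (assuming it is installed):

nvm install 18
nvm use 18
node --version   # should now print v18.x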

szprytny commented Oct 1, 2023

[screenshot]

I tried to run a whisper model via the automatic-speech-recognition pipeline and got the same error, caused by an unsupported AutoModelForCTC. This PR might have introduced the bug:
https://github.com/xenova/transformers.js/pull/220/files?file-filters%5B%5D=.js&show-viewed-files=true#diff-2f6b66f61363f7b45e1b165f81d3ce15b3768da43e40410085aee8bd8666a629R1739

xenova (Collaborator) commented Oct 2, 2023

@szprytny Could you provide more information about your environment? Are you using the latest version of Transformers.js?

szprytny commented Oct 2, 2023

I have:
node 18.9.1
transformers.js 2.6.2

When I removed the declaration of AutoModelForCTC from https://github.com/xenova/transformers.js/blob/main/src/pipelines.js#L1953, the pipeline went further. I then got the error Unsupported model IR version: 9, which I was able to get past by overriding onnxruntime-node in my project's package.json.
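For reference, a sketch of such an override in package.json with pnpm (the version pin is illustrative; with plain npm the top-level "overrides" field plays the same role):

{
  "pnpm": {
    "overrides": {
      "onnxruntime-node": "1.16.0"
    }
  }
}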

xenova (Collaborator) commented Oct 2, 2023

And which bundler are you using? I am aware of issues with create-react-app; I haven't had any problems with Vite, for example.

I got error Unsupported model IR version: 9

Yes, this is because you exported with onnx >= 1.14, and Transformers.js still uses onnxruntime-web v1.14 (which only supports a max IR version of 8). See here for an issue I filed a while ago.

szprytny commented Oct 2, 2023

I did not run it as a web app; I just tried to do inference using a plain Node script run with npx tsx.

xenova (Collaborator) commented Oct 2, 2023

@szprytny Can you provide some sample code which resulted in this error?

szprytny commented Oct 2, 2023

It seems that the error

Unsupported model type: whisper

is misleading, as the real problem was that my model has a newer IR version. That error is not handled well enough, and ends up calling from_pretrained on the AutoModelForCTC class in the loadItems function.

Here is the script I used to run it:

import { WaveFile } from "wavefile";
import path from "path";
import { readFileSync } from "fs";
import { pipeline, env } from "@xenova/transformers";

env.localModelPath = "c:/model/onnx/";

const prepareAudio = (filePath: string): Float64Array => {
  // Read the WAV file and convert it to what Whisper expects:
  // 32-bit float samples at a 16 kHz sample rate.
  const wav = new WaveFile(readFileSync(path.normalize(filePath)));
  wav.toBitDepth("32f");
  wav.toSampleRate(16000);

  // Note: getSamples() returns one array per channel for multi-channel
  // audio; this assumes a mono file.
  return wav.getSamples();
};

const test = async () => {
  let pipe = await pipeline("automatic-speech-recognition", "shmisper", {
    local_files_only: true,
  });

  let out = await pipe(prepareAudio("c:/content/01_0.wav"));
  console.log(out);
};

test();

xenova (Collaborator) commented Oct 2, 2023

I see... Indeed, that error message would be quite misleading. Could you try downgrading to onnx==1.13.1 and re-exporting your model? See https://github.com/xenova/transformers.js/blob/main/scripts/requirements.txt for the other recommended versions.
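For example (model id and output directory are placeholders):

pip install onnx==1.13.1
optimum-cli export onnx --model openai/whisper-base ./whisper-base-onnx/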

Keith-Hon commented Oct 25, 2023

I have the exact same problem. I changed the onnx version to 1.13.1. The small model works, but not the medium and large-v2 models.

dmmagdal commented

Having the same issue as the main thread:

  • OSX 14.1 Sonoma
  • M2 chip
  • Node 18.12.1
  • transformers.js 2.10.1

You mentioned here that we should use onnx==1.13.1 per your conversion scripts. Does Hugging Face's Optimum conversion script (i.e., optimum-cli export onnx --model model_id) also work with your script? I noticed it doesn't move all the ONNX files into their own folder (something I can do manually), but is the process of exporting to ONNX the same? If so, is optimum-cli using a different version of onnx than what your repo is using?

xenova (Collaborator) commented Dec 11, 2023

Yes, we use Optimum behind the scenes. The purpose of the conversion script is to also perform quantization afterwards, but if this is not necessary for your use case, you can use Optimum directly and just structure the repo like the other Transformers.js models on the HF Hub.
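A rough sketch of that layout, based on how the Xenova/whisper-* repos on the Hub are organised (exact file names depend on the export):

my-whisper-model/
├── config.json
├── generation_config.json
├── preprocessor_config.json
├── tokenizer.json
├── tokenizer_config.json
└── onnx/
    ├── encoder_model.onnx
    └── decoder_model_merged.onnx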

dmmagdal commented

I converted the whisper-base model to ONNX using optimum-cli, moved the model files into the onnx folder locally, and verified my environment had the same module versions as your requirements.txt. When I try to run my inference script (Node.js), I still end up with errors: output.txt

itsyoboieltr commented

@xenova I could reproduce this error on the v3 branch with the whisper-word-timestamps example. If I go to worker.js and change the model_id from onnx-community/whisper-base_timestamped to Xenova/whisper-large-v3, I get the error: Unsupported model type: whisper

nsenkevich commented Aug 26, 2024

Same here.

[screenshot]

When trying to use distil-whisper/distil-medium.en on Whisper WebGPU: Unsupported model type: whisper, with "@huggingface/transformers": "^3.0.0-alpha.9".
