diff --git a/docs/source/model_doc/speech_to_text_2.mdx b/docs/source/model_doc/speech_to_text_2.mdx index 62509b67ec32..72754b67aab9 100644 --- a/docs/source/model_doc/speech_to_text_2.mdx +++ b/docs/source/model_doc/speech_to_text_2.mdx @@ -69,7 +69,7 @@ predicted token ids. >>> ds = ds.map(map_to_array) >>> inputs = processor(ds["speech"][0], sampling_rate=16_000, return_tensors="pt") ->>> generated_ids = model.generate(input_ids=inputs["input_values"], attention_mask=inputs["attention_mask"]) +>>> generated_ids = model.generate(inputs=inputs["input_values"], attention_mask=inputs["attention_mask"]) >>> transcription = processor.batch_decode(generated_ids) ```