"""Minimal Gradio app that transcribes an audio clip to text."""

from typing import Optional

import gradio as gr
from transformers import pipeline

# No checkpoint is named here, so the library chooses the model for this task.
# Built once at module level so each request reuses the same pipeline object.
model = pipeline("automatic-speech-recognition")


def transcribe_audio(audio: Optional[str]) -> str:
    """Return the transcription of the audio clip at *audio*.

    Args:
        audio: Path to the audio file supplied by the ``gr.Audio`` input
            (configured with ``type="filepath"``), or ``None`` when the
            form was submitted without a clip.

    Returns:
        The value stored under the ``"text"`` key of the pipeline's result.

    Raises:
        gr.Error: If no audio was provided, so the UI can show a readable
            message instead of an opaque pipeline failure.
    """
    if audio is None:
        raise gr.Error("Please record or upload an audio clip first.")
    return model(audio)["text"]


# Kept as a module-level name so the interface can be imported or reloaded
# without starting the server.
demo = gr.Interface(
    fn=transcribe_audio,
    inputs=gr.Audio(type="filepath"),
    outputs="text",
)

if __name__ == "__main__":
    # Launch only when run as a script; importing this module must not start
    # a server.
    demo.launch(debug=True)