import gradio as gr
from transformers import pipeline

# Speech-recognition pipeline, constructed once at import time so that every
# call to the transcription function reuses the same loaded model.
model = pipeline(
    task="automatic-speech-recognition",
    model="facebook/wav2vec2-base-960h",
)

def audiototext(audio):
    """Transcribe an audio file to text using the module-level ASR pipeline.

    Args:
        audio: Path to the audio file to transcribe, as handed over by the
            Gradio ``Audio`` input (configured with ``type="filepath"``).
            May be ``None`` or an empty string when nothing was uploaded.

    Returns:
        The ``'text'`` field of the pipeline result, or an empty string when
        no audio was supplied.
    """
    # Gradio passes None when the user submits without providing a file;
    # forwarding that to the pipeline would raise instead of giving the UI a
    # clean (empty) transcript.
    if audio is None or (isinstance(audio, str) and not audio):
        return ""
    return model(audio)['text']

# Build the web UI: one audio-upload input wired to `audiototext`, one textbox
# output, and a handful of clickable example files.
# NOTE(review): `source="upload"` is the Gradio 3.x spelling; newer releases
# appear to use `sources=[...]` instead — confirm against the pinned version.
demo = gr.Interface(
    fn=audiototext,
    inputs=gr.Audio(source="upload", type="filepath"),
    outputs=["textbox"],
    # Relative paths; presumably these files ship alongside this script.
    examples=[
        "Hey_Siri.wav",
        "Martin.mp3",
        "download.wav",
        "30_Second_Song.mp3",
    ],
    title="AUDIO TO TEXT CONVERSION",
)

# Start serving the interface as soon as this module is executed.
demo.launch()