"""Transcribe a local audio file with a Whisper speech-recognition pipeline."""

from transformers import pipeline

# Read the audio once as raw bytes; the bytes are handed to the pipeline
# below so the file is not opened a second time.
with open("mlk.flac", "rb") as f:
    data = f.read()

# Build an automatic-speech-recognition pipeline backed by the
# "openai/whisper-large-v2" checkpoint.
pipe = pipeline("automatic-speech-recognition", "openai/whisper-large-v2")

# The pipeline accepts the content of an audio file as bytes (as well as a
# filename), so pass the data that was already read.
pipe(data)
# Example output as recorded with the original snippet:
# {'text': "GOING ALONG SLUSHY COUNTRY ROADS AND SPEAKING TO DAMP AUDIENCES IN DRAUGHTY SCHOOL ROOMS DAY AFTER DAY FOR A FORTNIGHT HE'LL HAVE TO PUT IN AN APPEARANCE AT SOME PLACE OF WORSHIP ON SUNDAY MORNING AND HE CAN COME TO US IMMEDIATELY AFTERWARDS"}