# voice-to-code-backend / whisper_model.py
# ShobhitKori
# Updated codet5_model.py
# 62522ae
# raw
# history blame contribute delete
# 649 Bytes
import os
import whisper
import logging
# Add FFmpeg directory to PATH
# os.environ["PATH"] += os.pathsep + r"C:\ffmpeg\bin"
# Local directory passed to Whisper as its download root for the checkpoint.
WHISPER_MODEL_DIR = "./data/whisper-small"

# Create the directory up front; exist_ok=True makes repeated imports harmless.
os.makedirs(name=WHISPER_MODEL_DIR, exist_ok=True)

# Load the "small" Whisper model once at import time so every call to
# transcribe_audio shares this single instance.
model = whisper.load_model(
    name="small",
    download_root=WHISPER_MODEL_DIR,
)
# def transcribe_audio(file_path: str) -> str:
# result = model.transcribe(file_path)
# return result["text"]
# Set up root-logger output at INFO level. This is a module-level statement,
# so it runs on import; transcribe_audio below logs through logging.info().
logging.basicConfig(level=logging.INFO)
def transcribe_audio(file_path):
    """Transcribe audio with the module-level Whisper ``model``.

    An INFO message is logged before the call to ``model.transcribe`` and
    another one once it has returned.

    Args:
        file_path: Audio input forwarded unchanged to ``model.transcribe``
            (presumably a path to an audio file -- confirm against callers).

    Returns:
        The value stored under the ``"text"`` key of the transcription result.
    """
    logging.info("Starting transcription for %s", file_path)
    transcription = model.transcribe(file_path)
    logging.info("Transcription completed")

    # Only the text is handed back; the rest of the result is dropped.
    text = transcription["text"]
    return text