DMOSpeech2 / requirements.txt
mrfakename's picture
pt 1
597cecf
raw
history blame contribute delete
665 Bytes
# Main dependencies
# Install with: pip install -r requirements.txt
accelerate>=0.33.0
# bitsandbytes has platform restrictions (not for arm64 or Darwin/macOS), so the
# environment marker below makes pip skip it on those platforms instead of
# attempting an install there.
bitsandbytes>0.37.0; platform_machine != "arm64" and platform_system != "Darwin"
cached_path
click
datasets
ema_pytorch>=0.5.2
gradio>=3.45.2
hydra-core>=1.3.0
jieba
librosa
matplotlib
# Upper-bounded pins: do not raise without testing.
numpy<=1.26.4
pydantic<=2.10.6
pydub
pypinyin
safetensors
soundfile
tomli
torch>=2.0.0
torchaudio>=2.0.0
torchdiffeq
tqdm>=4.65.0
transformers
transformers_stream_generator
unidecode
vocos
wandb
x_transformers>=1.31.14

# Optional dependencies for evaluation
# Uncomment if you need eval features:
# faster_whisper==0.10.1
# funasr
# jiwer
# modelscope
# zhconv
# zhon