File size: 388 Bytes
ea8c646
13d172f
 
ef3cbd4
7b0e04c
ea8c646
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# Python package dependencies in pip requirements format, grouped by purpose.
# NOTE(review): no entry carries a version specifier, so every install resolves
# to whatever releases are current at that time — consider pinning a known-good set.

# Hugging Face libraries
transformers
huggingface_hub
accelerate
# NOTE(review): fastvideo is grouped with the Hugging Face libraries here, but it
# does not appear to be a Hugging Face package — confirm the grouping and that it is used.
fastvideo

# Qwen Omni helper (handles multimodal processing), installed with its "decord" extra
qwen-omni-utils[decord]

# PyTorch (for model execution)
torch
torchvision
torchaudio

# UI with chat interface
gradio

# Audio file writing (used for speech output)
soundfile

# Video/audio decoding
# NOTE(review): ffmpeg-python is presumably only a wrapper and would need the
# ffmpeg executable installed separately on the host — confirm for the deploy target.
ffmpeg-python
# NOTE(review): decord is also requested via the qwen-omni-utils[decord] extra above,
# so this standalone entry is likely redundant — confirm before removing.
decord
moviepy

# Utility libraries
numpy