File size: 1,117 Bytes
b3a5734
fae09c1
 
dda982a
4fab3b3
 
 
 
 
b3a5734
f7427de
4fab3b3
b3a5734
 
dda982a
 
b3a5734
fae09c1
b3a5734
98482ce
 
 
4fab3b3
 
 
 
 
 
dbdd7c8
 
 
 
033e4ba
 
c0c51c2
 
575f1c7
 
 
 
 
 
 
 
21c909d
575f1c7
21c909d
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# Core dependencies
pydantic==2.10.6
gradio
markdown==3.7
pillow  # Match exact dependency from GOT-OCR
numpy==1.26.3  # Match exact dependency from GOT-OCR

# For ZeroGPU support
spaces

# Image processing
opencv-python  # Match exact dependency from GOT-OCR

# Utility dependencies
python-dotenv>=1.0.0

# Gemini API client
google-genai==1.5.0

# Mistral AI client
mistralai>=1.0.0

# GOT-OCR dependencies - exactly as in original
torch
torchvision
git+https://github.com/huggingface/transformers.git@main
accelerate
verovio  # Added missing dependency
huggingface_hub[cli]>=0.19.0

# MarkItDown and its dependencies
markitdown[all]
ffmpeg-python  # For audio processing in MarkItDown
# Note: Using Gemini Flash 2.5 for LLM image descriptions instead of OpenAI

# Docling dependencies
docling

# RAG and LangChain dependencies
langchain>=0.3.0
langchain-openai>=0.2.0
langchain-google-genai>=2.0.0
langchain-chroma>=0.1.0
langchain-text-splitters>=0.3.0
langchain-community>=0.3.0  # For BM25Retriever and EnsembleRetriever
chromadb>=0.5.0
sentence-transformers>=3.0.0
rank-bm25>=0.2.0  # Required for BM25Retriever