# Python dependencies, one requirement specifier per line (pip requirements format).
# Install with: pip install -r <this file>

# Exact pins.
torch==2.4.0
fastapi==0.88.0
huggingface_hub==0.32.4
json5==0.9.25

# Unpinned: pip picks the newest release compatible with the pins in this file.
numpy
uvicorn

# The "onnxruntime-gpu" extra is requested from optimum.
optimum[onnxruntime-gpu]==1.25.3
transformers==4.51.3