fastapi
uvicorn[standard]
llama_cpp_python[server]==0.2.59
huggingface-hub
transformers
tensorflow[and-cuda]