gradio>=5.0,<6.0
huggingface-hub>=0.15.1
accelerate>=0.22.0
protobuf<4
# llama-cpp-python was removed to avoid a compilation step during installation.