# Python dependencies, one requirement specifier per line as pip's
# requirements file format expects.
gradio>=5.0,<6.0
huggingface-hub>=0.15.1
accelerate>=0.22.0
protobuf<4
# llama-cpp-python removed to avoid a compile step.