# Python package requirements, one specifier per line as the pip
# requirements-file format expects.
#
# Entries with a lower bound:
gradio>=4.0.0
torch>=2.0.0
transformers>=4.36.0
# Listed once: "huggingface_hub" and "huggingface-hub" normalize to the same
# distribution name, so the bounded entry below covers both spellings.
huggingface_hub>=0.20.0
llama-cpp-python>=0.2.0

# Entries without a version constraint (any available version is accepted):
python-dotenv
accelerate
protobuf
sentencepiece
gguf
hf_xet
pillow