# Python dependencies, one requirement specifier per line as required by
# pip's requirements-file format (`pip install -r <this file>`).
# Entries pinned with `==` install that exact version; unpinned entries are
# left to pip's resolver.
llama-cpp-python==0.2.55
faiss-cpu
transformers
sentencepiece
accelerate
langchain==0.1.11
setfit
rapidfuzz
peft
bitsandbytes
huggingface_hub
gradio==3.50.2
gradio-client