Update app.py
app.py
CHANGED
@@ -7,8 +7,11 @@ import transformers
 
 # model_from_hugging_face = transformers.pipeline("text-generation", model="TheBloke/Llama-2-7B-Chat-GGML")
 # Load model directly
-from
-
+# with ctransformers, you can load from Hugging Face Hub directly and specify a model file (.bin or .gguf files) using:
+
+from ctransformers import AutoModelForCausalLM
+
+llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGML", model_file="llama-2-7b-chat.ggmlv3.q8_0.bin")
 # # from langchain.llms import CTransformers
 # from langchain_community.llms import CTransformers
 
@@ -27,10 +30,7 @@ def getLLMResponse(form_input,email_sender,email_recipient,email_style):
 
 #C Transformers is the Python library that provides bindings for transformer models implemented in C/C++ using the GGML library
 
-llm =
-      model_type='llama',
-      config={'max_new_tokens': 256,
-              'temperature': 0.01})
+llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGML", model_file="llama-2-7b-chat.ggmlv3.q8_0.bin")
 
 
 #Template for building the PROMPT
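For context on the change: the model object returned by ctransformers' AutoModelForCausalLM.from_pretrained is directly callable on a prompt string, so the generation settings from the removed langchain CTransformers config (max_new_tokens=256, temperature=0.01) can be passed as call-time arguments instead. Below is a minimal sketch of how the updated app.py could use the loaded llm inside getLLMResponse; the prompt template and the example call are assumptions for illustration, not taken from the actual file.

# Sketch only: prompt wording is hypothetical, model loading mirrors the commit above
from ctransformers import AutoModelForCausalLM

# Load the GGML model file directly from the Hugging Face Hub
llm = AutoModelForCausalLM.from_pretrained(
    "TheBloke/Llama-2-7B-Chat-GGML",
    model_file="llama-2-7b-chat.ggmlv3.q8_0.bin",
)

def getLLMResponse(form_input, email_sender, email_recipient, email_style):
    # Hypothetical prompt template; the real template lives further down in app.py
    prompt = (
        f"Write an email in a {email_style} style about: {form_input}\n"
        f"Sender: {email_sender}\nRecipient: {email_recipient}\n\nEmail:\n"
    )
    # The ctransformers model is callable; generation kwargs mirror the
    # removed CTransformers config (max_new_tokens=256, temperature=0.01)
    return llm(prompt, max_new_tokens=256, temperature=0.01)

print(getLLMResponse("a project status update", "Alice", "Bob", "formal"))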