alexkueck committed on
Commit
c10830c
1 Parent(s): aa47f31

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -85,7 +85,7 @@ MODEL_NAME = "gpt-3.5-turbo-16k"
85
 
86
  #HuggingFace--------------------------------
87
  #repo_id = "meta-llama/Llama-2-13b-chat-hf"
88
- repo_id = "HuggingFaceH4/zephyr-7b-alpha"
89
  #repo_id = "meta-llama/Llama-2-70b-chat-hf"
90
  #repo_id = "tiiuae/falcon-40b"
91
  #repo_id = "Vicuna-33b"
@@ -304,9 +304,9 @@ def invoke (prompt, history, rag_option, openai_api_key, temperature=0.9, max_n
304
  #LLM auswählen (OpenAI oder HF)
305
  ###########################
306
  #Anfrage an OpenAI ----------------------------
307
- #llm = ChatOpenAI(model_name = MODEL_NAME, openai_api_key = openai_api_key, temperature=temperature)#, top_p = top_p)
308
  #oder an Hugging Face --------------------------
309
- llm = HuggingFaceHub(repo_id=repo_id, model_kwargs={"temperature": 0.5, "max_length": 64})
310
  #llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
311
  #llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
312
 
 
85
 
86
  #HuggingFace--------------------------------
87
  #repo_id = "meta-llama/Llama-2-13b-chat-hf"
88
+ repo_id = "HuggingFaceH4/zephyr-7b-alpha" #das Modell ist echt gut!!!
89
  #repo_id = "meta-llama/Llama-2-70b-chat-hf"
90
  #repo_id = "tiiuae/falcon-40b"
91
  #repo_id = "Vicuna-33b"
 
304
  #LLM auswählen (OpenAI oder HF)
305
  ###########################
306
  #Anfrage an OpenAI ----------------------------
307
+ llm = ChatOpenAI(model_name = MODEL_NAME, openai_api_key = openai_api_key, temperature=temperature)#, top_p = top_p)
308
  #oder an Hugging Face --------------------------
309
+ #llm = HuggingFaceHub(repo_id=repo_id, model_kwargs={"temperature": 0.5, "max_length": 64})
310
  #llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
311
  #llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
312