audrito committed on
Commit
e9e8562
1 Parent(s): ba3e48c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -7
app.py CHANGED
@@ -7,15 +7,14 @@ description = "This is a demo of Synthia 7B GGUF running on spaces cpu basic har
7
 
8
  model_path = "models"
9
  model_name = "synthia-7b-v2.0-16k.Q4_K_M.gguf"
10
- hf_hub_download(repo_id="TheBloke/SynthIA-7B-v2.0-16k-GGUF", filename=model_name, local_dir=model_path, local_dir_use_symlinks=False)
11
 
12
  try:
13
- model = GPT4All(model_name, model_path, allow_download=False, device="cpu")
14
  print("Model loaded successfully.")
15
  except Exception as e:
16
  print("Error loading the model:", str(e))
17
 
18
-
19
  model.config["promptTemplate"] = "[INST] {0} [/INST]"
20
  model.config["systemPrompt"] = ""
21
  model._is_chat_session_activated = False
@@ -31,9 +30,7 @@ def generater(message, history, temperature, top_p, top_k):
31
  outputs = []
32
  for token in model.generate(prompt=prompt, temp=temperature, top_k = top_k, top_p = top_p, max_tokens = max_new_tokens, streaming=True):
33
  outputs.append(token)
34
- yield "".join(outputs)
35
-
36
-
37
 
38
  def vote(data: gr.LikeData):
39
  if data.liked:
@@ -93,7 +90,7 @@ iface = gr.ChatInterface(
93
 
94
  with gr.Blocks(css="resourse/style/custom.css") as demo:
95
  chatbot.like(vote, None, None)
96
- iface.render()
97
 
98
  if __name__ == "__main__":
99
  demo.queue(max_size=3).launch()
 
7
 
8
  model_path = "models"
9
  model_name = "synthia-7b-v2.0-16k.Q4_K_M.gguf"
10
+ model_path = hf_hub_download(repo_id="TheBloke/SynthIA-7B-v2.0-16k-GGUF", filename=model_name, local_dir=model_path, local_dir_use_symlinks=False)
11
 
12
  try:
13
+ model = GPT4All(model_path, allow_download=False, device="cpu")
14
  print("Model loaded successfully.")
15
  except Exception as e:
16
  print("Error loading the model:", str(e))
17
 
 
18
  model.config["promptTemplate"] = "[INST] {0} [/INST]"
19
  model.config["systemPrompt"] = ""
20
  model._is_chat_session_activated = False
 
30
  outputs = []
31
  for token in model.generate(prompt=prompt, temp=temperature, top_k = top_k, top_p = top_p, max_tokens = max_new_tokens, streaming=True):
32
  outputs.append(token)
33
+ return "".join(outputs)
 
 
34
 
35
  def vote(data: gr.LikeData):
36
  if data.liked:
 
90
 
91
  with gr.Blocks(css="resourse/style/custom.css") as demo:
92
  chatbot.like(vote, None, None)
93
+ iface.launch()
94
 
95
  if __name__ == "__main__":
96
  demo.queue(max_size=3).launch()