Update app.py
app.py CHANGED
@@ -13,6 +13,7 @@ model_name = model_id.split('/')[-1]
 title = f"🇩🇪 {model_name}"
 description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_name}</a> in GGUF format ({quant})!"
 
+print("loading model")
 # Initialize the LLM
 llm = Llama(model_path="model.gguf",
             n_ctx=32768,
@@ -20,7 +21,7 @@ llm = Llama(model_path="model.gguf",
             chat_format=chat_template)
 
 # Function for streaming chat completions
-def chat_stream_completion(message, history, system_prompt):
+def chat_stream_completion(message, history):
     #messages_prompts = [{"role": "system", "content": system_prompt}]
     messages_prompts = []
     for human, assistant in history:
@@ -39,6 +40,7 @@ def chat_stream_completion(message, history, system_prompt):
         message_repl = message_repl + chunk['choices'][0]["delta"]["content"]
         yield message_repl
 
+print("starting gradio")
 # Gradio chat interface
 gr.ChatInterface(
     fn=chat_stream_completion,
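The diff only shows fragments of app.py, so here is a minimal sketch of what the whole file plausibly looks like after this commit. Everything not visible in the context lines above is an assumption: the imports, the body of the streaming loop, and the ChatInterface/launch arguments are reconstructed from the standard llama-cpp-python and Gradio APIs, and the model_id, quant, and chat_template values are hypothetical placeholders.

# Sketch of app.py after this commit; lines not shown in the diff are assumptions.
import gradio as gr
from llama_cpp import Llama

model_id = "owner/model-GGUF"  # hypothetical; the real value is set earlier in the file
model_name = model_id.split('/')[-1]
quant = "Q4_K_M"               # hypothetical
chat_template = "chatml"       # hypothetical

title = f"🇩🇪 {model_name}"
description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_name}</a> in GGUF format ({quant})!"

print("loading model")
# Initialize the LLM
llm = Llama(model_path="model.gguf",
            n_ctx=32768,
            chat_format=chat_template)

# Function for streaming chat completions
def chat_stream_completion(message, history):
    #messages_prompts = [{"role": "system", "content": system_prompt}]
    messages_prompts = []
    for human, assistant in history:
        messages_prompts.append({"role": "user", "content": human})
        messages_prompts.append({"role": "assistant", "content": assistant})
    messages_prompts.append({"role": "user", "content": message})

    # Stream the reply token by token; create_chat_completion(stream=True)
    # is llama-cpp-python's streaming API, and the middle of this loop is
    # reconstructed from the two context lines visible in the diff.
    response = llm.create_chat_completion(messages=messages_prompts, stream=True)
    message_repl = ""
    for chunk in response:
        delta = chunk['choices'][0]["delta"]
        if "content" in delta:
            message_repl = message_repl + delta["content"]
            yield message_repl

print("starting gradio")
# Gradio chat interface
gr.ChatInterface(
    fn=chat_stream_completion,
    title=title,
    description=description,
).queue().launch()

Dropping the unused system_prompt parameter matches the commented-out system-message line at the top of the function, and the two added print calls presumably make startup progress visible in the Space's logs while the model loads.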
|