Spaces:

zhangtao103239
/

NeuralHermes-2.5-Mistral-7B-GGUF-Chat

Sleeping

App Files Files Community

zhangtao committed on Dec 27, 2023

Commit

728ac62

•

1 Parent(s): 5b3edb5

增加中文翻译功能

Browse files

Files changed (2) hide show

Dockerfile +2 -0
app.py +82 -25

Dockerfile CHANGED Viewed

@@ -7,6 +7,8 @@ WORKDIR /code
 RUN wget https://huggingface.co/TheBloke/NeuralHermes-2.5-Mistral-7B-GGUF/resolve/main/neuralhermes-2.5-mistral-7b.Q5_K_M.gguf?download=true -O neuralhermes-2.5-mistral-7b.Q5_K_M.gguf
 COPY ./requirements.txt /code/requirements.txt
 RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

 RUN wget https://huggingface.co/TheBloke/NeuralHermes-2.5-Mistral-7B-GGUF/resolve/main/neuralhermes-2.5-mistral-7b.Q5_K_M.gguf?download=true -O neuralhermes-2.5-mistral-7b.Q5_K_M.gguf
+RUN wget https://huggingface.co/zhangtao103239/Qwen-1.8B-GGUF/resolve/main/qwen-1.8b-q5_k_m.gguf?download=true -O qwen-1.8b-q5_k_m.gguf
 COPY ./requirements.txt /code/requirements.txt
 RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

app.py CHANGED Viewed

@@ -1,45 +1,102 @@
 import gradio as gr
 from llama_cpp import Llama
 import json
 llm = Llama(model_path="./neuralhermes-2.5-mistral-7b.Q5_K_M.gguf",
-            n_ctx=32768,
             n_threads=2,
             chat_format="chatml")
-def chat_completion(messages, history, system_prompt):
     messages_prompts = [{"role": "system", "content": system_prompt}]
     for human, assistant in history:
         messages_prompts.append({"role": "user", "content": human})
         messages_prompts.append({"role": "assistant", "content": assistant})
-    messages_prompts.append({"role": "user", "content": messages})
     response = llm.create_chat_completion(
         messages=messages_prompts,
         stream=False
     )
     print(json.dumps(response, ensure_ascii=False, indent=2))
-    return response['choices'][0]['content']
-def chat_stream_completion(messages, history, system_prompt):
     messages_prompts = [{"role": "system", "content": system_prompt}]
-    for human, assistant in history:
-        messages_prompts.append({"role": "user", "content": human})
-        messages_prompts.append({"role": "assistant", "content": assistant})
-    messages_prompts.append({"role": "user", "content": messages})
-    response = llm.create_chat_completion(
-        messages=messages_prompts,
-        stream=True
-    )
-    partial_message = ""
-    for chunk in response:
-        if len(chunk['choices'][0]["delta"]) != 0 and "content" in chunk['choices'][0]["delta"]:
-            partial_message = partial_message + \
-                chunk['choices'][0]["delta"]["content"]
-        yield partial_message
-gr.ChatInterface(chat_stream_completion,
-                 additional_inputs=[gr.Textbox(
-                     "You are helpful AI.", label="System Prompt")]
-                 ).queue().launch(server_name="0.0.0.0")

 import gradio as gr
 from llama_cpp import Llama
 import json
+import time
 llm = Llama(model_path="./neuralhermes-2.5-mistral-7b.Q5_K_M.gguf",
+            n_ctx=1024,
             n_threads=2,
             chat_format="chatml")
+llm_for_translate = Llama(model_path="./qwen-1.8b-q5_k_m.gguf",
+            n_ctx=1024,
+            n_threads=2,
+            chat_format="chatml")
+chi_eng_dict = []
+def get_dict_result(original_text):
+    for d in chi_eng_dict:
+        if d[0] == original_text:
+            return d[1]
+        elif d[1] == original_text:
+            return d[0]
+    return None
+def stream_translate_into(message, language='English'):
+    return llm.create_chat_completion(
+        messages=[{"role": "system", "content": f"Translate words into {language}. Regardless the meanning!"},
+                    {"role": "user", "content": f"'{message}'"}],
+        stream=True,
+        stop=['\n\n']
+    )
+def chat_completion(message, history, system_prompt):
     messages_prompts = [{"role": "system", "content": system_prompt}]
     for human, assistant in history:
         messages_prompts.append({"role": "user", "content": human})
         messages_prompts.append({"role": "assistant", "content": assistant})
+    messages_prompts.append({"role": "user", "content": message})
     response = llm.create_chat_completion(
         messages=messages_prompts,
         stream=False
     )
     print(json.dumps(response, ensure_ascii=False, indent=2))
+    return response['choices'][0]['message']['content']
+def chat_stream_completion(message, history, system_prompt, translate_check):
     messages_prompts = [{"role": "system", "content": system_prompt}]
+    if translate_check:
+        if len(history) > 0:
+            for human, assistant in history:
+                human_repl = get_dict_result(human)
+                assistant_repl = get_dict_result(assistant)
+                if human_repl is None or assistant_repl is None:
+                    print(chi_eng_dict)
+                    raise gr.Error("历史信息缺少翻译字典，请勿中途修改翻译功能！")
+                messages_prompts.append({"role": "user", "content": human_repl})
+                messages_prompts.append({"role": "assistant", "content": assistant_repl})
+        message_repl = ""
+        for chunk in stream_translate_into(message, language='English'):
+            if len(chunk['choices'][0]["delta"]) != 0 and "content" in chunk['choices'][0]["delta"]:
+                message_repl = message_repl + \
+                    chunk['choices'][0]["delta"]["content"]
+        chi_eng_dict.append((message, message_repl))
+        messages_prompts.append({"role": "user", "content": message_repl})
+        print(messages_prompts)
+        response = llm.create_chat_completion(
+            messages=messages_prompts,
+            stream=False,
+            stop=['\n\n']
+        )
+        print(json.dumps(response, ensure_ascii=False, indent=2))
+        result = response['choices'][0]['message']['content']
+        result_repl = ""
+        for chunk in stream_translate_into(result, language='Chinese'):
+            if len(chunk['choices'][0]["delta"]) != 0 and "content" in chunk['choices'][0]["delta"]:
+                result_repl = result_repl + \
+                    chunk['choices'][0]["delta"]["content"]
+                yield result_repl
+        chi_eng_dict.append((result, result_repl))
+    else:
+        for human, assistant in history:
+            messages_prompts.append({"role": "user", "content": human})
+            messages_prompts.append({"role": "assistant", "content": assistant})
+        messages_prompts.append({"role": "user", "content": message})
+        response = llm.create_chat_completion(
+            messages=messages_prompts,
+            stream=True
+        )
+        message_repl = ""
+        for chunk in response:
+            if len(chunk['choices'][0]["delta"]) != 0 and "content" in chunk['choices'][0]["delta"]:
+                message_repl = message_repl + \
+                    chunk['choices'][0]["delta"]["content"]
+            yield message_repl
+gr.ChatInterface(
+    chat_stream_completion,
+    additional_inputs=[gr.Textbox(
+        "You are helpful AI.", label="System Prompt"), gr.Checkbox(label="Translate?")]
+).queue().launch(server_name="0.0.0.0")