Spaces:

MakiAi
/

BOREA_DEMO

Sleeping

App Files Files Community

MakiAi committed on Sep 14, 2024

Commit

6480777

verified ·

1 Parent(s): f713d11

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -18

app.py CHANGED Viewed

@@ -6,19 +6,21 @@ from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStream
 import gradio as gr
 from threading import Thread
 MODELS = {
-    "Phi-3.5-mini": "microsoft/Phi-3.5-mini-instruct",
     "Borea-Phi-3.5-mini-Jp": "AXCXEPT/Borea-Phi-3.5-mini-Instruct-Jp",
-    "EZO-Common-9B": "HODACHI/EZO-Common-9B-gemma-2-it"
 }
 HF_TOKEN = os.environ.get("HF_TOKEN", None)
-TITLE = "<h1><center>Multi-Model Chat Interface</center></h1>"
 PLACEHOLDER = """
 <center>
-<p>Hi, I'm an AI assistant. Ask me anything.</p>
 </center>
 """
@@ -40,7 +42,8 @@ quantization_config = BitsAndBytesConfig(
     load_in_4bit=True,
     bnb_4bit_compute_dtype=torch.bfloat16,
     bnb_4bit_use_double_quant=True,
-    bnb_4bit_quant_type="nf4")
 model = None
 tokenizer = None
@@ -53,7 +56,8 @@ def load_model(model_name):
         model_path,
         torch_dtype=torch.bfloat16,
         device_map="auto",
-        quantization_config=quantization_config)
 @spaces.GPU()
 def stream_chat(
@@ -68,10 +72,10 @@ def stream_chat(
     model_name: str = "Phi-3.5-mini"
 ):
     global model, tokenizer
     if model is None or tokenizer is None or model.name_or_path != MODELS[model_name]:
         load_model(model_name)
     print(f'message: {message}')
     print(f'history: {history}')
@@ -121,22 +125,22 @@ with gr.Blocks(css=CSS, theme='ParityError/Interstellar') as demo:
         fill_height=True,
         additional_inputs=[
             gr.Textbox(
-                value="You are a helpful assistant",
-                label="System Prompt",
             ),
             gr.Slider(
                 minimum=0,
                 maximum=1,
                 step=0.1,
                 value=0.8,
-                label="Temperature",
             ),
             gr.Slider(
                 minimum=128,
                 maximum=8192,
                 step=1,
                 value=1024,
-                label="Max new tokens",
             ),
             gr.Slider(
                 minimum=0.0,
@@ -157,19 +161,19 @@ with gr.Blocks(css=CSS, theme='ParityError/Interstellar') as demo:
                 maximum=2.0,
                 step=0.1,
                 value=1.2,
-                label="Repetition penalty",
             ),
             gr.Dropdown(
                 choices=list(MODELS.keys()),
                 value="Phi-3.5-mini",
-                label="Model",
             ),
         ],
         examples=[
-            ["Help me study vocabulary: write a sentence for me to fill in the blank, and I'll try to pick the correct option."],
-            ["What are 5 creative things I could do with my kids' art? I don't want to throw them away, but it's also so much clutter."],
-            ["Tell me a random fun fact about the Roman Empire."],
-            ["Show me a code snippet of a website's sticky header in CSS and JavaScript."],
         ],
         cache_examples=False,
     )

 import gradio as gr
 from threading import Thread
+# モデルの定義
 MODELS = {
     "Borea-Phi-3.5-mini-Jp": "AXCXEPT/Borea-Phi-3.5-mini-Instruct-Jp",
+    "EZO-Common-9B": "HODACHI/EZO-Common-9B-gemma-2-it",
+    "Phi-3.5-mini": "microsoft/Phi-3.5-mini-instruct",
 }
 HF_TOKEN = os.environ.get("HF_TOKEN", None)
+# タイトルとプレースホルダーを日本語に変更
+TITLE = "<h1><center>Borea/EZO デモアプリ</center></h1>"
 PLACEHOLDER = """
 <center>
+<p>こんにちは、私はAIアシスタントです。何でも質問してください。</p>
 </center>
 """
     load_in_4bit=True,
     bnb_4bit_compute_dtype=torch.bfloat16,
     bnb_4bit_use_double_quant=True,
+    bnb_4bit_quant_type="nf4"
+)
 model = None
 tokenizer = None
         model_path,
         torch_dtype=torch.bfloat16,
         device_map="auto",
+        quantization_config=quantization_config
+    )
 @spaces.GPU()
 def stream_chat(
     model_name: str = "Phi-3.5-mini"
 ):
     global model, tokenizer
     if model is None or tokenizer is None or model.name_or_path != MODELS[model_name]:
         load_model(model_name)
     print(f'message: {message}')
     print(f'history: {history}')
         fill_height=True,
         additional_inputs=[
             gr.Textbox(
+                value="あなたは親切なアシスタントです。",
+                label="システムプロンプト",
             ),
             gr.Slider(
                 minimum=0,
                 maximum=1,
                 step=0.1,
                 value=0.8,
+                label="温度 (Temperature)",
             ),
             gr.Slider(
                 minimum=128,
                 maximum=8192,
                 step=1,
                 value=1024,
+                label="最大新規トークン数",
             ),
             gr.Slider(
                 minimum=0.0,
                 maximum=2.0,
                 step=0.1,
                 value=1.2,
+                label="繰り返しペナルティ",
             ),
             gr.Dropdown(
                 choices=list(MODELS.keys()),
                 value="Phi-3.5-mini",
+                label="モデル選択",
             ),
         ],
         examples=[
+            ["語彙の勉強を手伝ってください。空欄を埋めるための文章を書いてください。私は正しい選択肢を選びます。"],
+            ["子供のアート作品でできる5つの創造的なことを教えてください。捨てたくはないのですが、散らかってしまいます。"],
+            ["ローマ帝国についてのランダムな面白い事実を教えてください。"],
+            ["ウェブサイトの固定ヘッダーのCSSとJavaScriptのコードスニペットを見せてください。"],
         ],
         cache_examples=False,
     )