File size: 6,328 Bytes
f9b9d56 83ee74c 574f73e 705c5b5 83ee74c f9b9d56 ad9db85 7ddfb78 ad9db85 f9b9d56 705c5b5 0997082 705c5b5 0997082 d57197f ad9db85 7ffca43 705c5b5 7ffca43 705c5b5 d57197f 0997082 705c5b5 83ee74c 0997082 ad9db85 f2c0975 83ee74c 0997082 83ee74c 7ffca43 705c5b5 d57197f 0997082 7ffca43 d57197f 705c5b5 7b3fa19 7ffca43 7b3fa19 f86099a 7b3fa19 63c5e29 ad9db85 7ffca43 63c5e29 ad9db85 7ffca43 f86099a d57197f 7ffca43 63c5e29 f86099a 63c5e29 7ffca43 ad9db85 7ffca43 ad9db85 7ffca43 63c5e29 f9b9d56 63c5e29 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 |
import gradio as gr
from huggingface_hub import InferenceClient
import os
import pandas as pd
from typing import List, Tuple
# LLM model definitions: short label -> Hugging Face model id.
LLM_MODELS = {
    "Default": "CohereForAI/c4ai-command-r-plus-08-2024",  # default model
    "Meta": "meta-llama/Llama-3.3-70B-Instruct",
    "Mistral": "mistralai/Mistral-Nemo-Instruct-2407",
    "Alibaba": "Qwen/QwQ-32B-Preview",
}
def get_client(model_name):
    """Create an inference client for one of the configured models.

    Args:
        model_name: A key of ``LLM_MODELS`` (for example ``"Default"``).

    Returns:
        An ``InferenceClient`` built from the mapped model id, using the
        value of the ``HF_TOKEN`` environment variable as its token
        (``None`` when the variable is unset).

    Raises:
        KeyError: If ``model_name`` is not a key of ``LLM_MODELS``.
    """
    model_id = LLM_MODELS[model_name]
    hf_token = os.getenv("HF_TOKEN")
    return InferenceClient(model_id, token=hf_token)
def read_uploaded_file(file):
    """Return the textual content of an uploaded file.

    Args:
        file: ``None``, a filesystem path (``str`` or ``os.PathLike``), or
            an object exposing ``.name`` and/or ``.read()``. The upload
            widget in this file is configured with ``type="filepath"``, so
            a plain path string must be accepted here.

    Returns:
        ``""`` when ``file`` is ``None``. For a path ending in
        ``.parquet``, the first 10 rows rendered as a Markdown table.
        Otherwise the file content, decoded as UTF-8 when it is bytes.
        If anything goes wrong, a message string describing the error is
        returned instead of raising.
    """
    if file is None:
        return ""
    try:
        # Resolve a path from either a path-like value or a file object.
        if isinstance(file, (str, os.PathLike)):
            path = os.fspath(file)
        else:
            path = getattr(file, "name", None)

        if isinstance(path, str) and path.endswith('.parquet'):
            df = pd.read_parquet(path, engine='pyarrow')
            return df.head(10).to_markdown(index=False)

        if hasattr(file, "read"):
            # File-like object: keep the original behaviour of reading it.
            content = file.read()
        else:
            # Plain path: read raw bytes and decode below.
            with open(path, "rb") as handle:
                content = handle.read()

        if isinstance(content, bytes):
            return content.decode('utf-8')
        return content
    except Exception as e:
        # Best-effort boundary: the caller embeds whatever string comes
        # back, so report the failure as text rather than raising.
        # NOTE(review): this literal appears mis-encoded in this copy of
        # the file (Korean for roughly "an error occurred while reading
        # the file"); it is kept exactly as found.
        return f"νμΌμ μ½λ μ€ μ€λ₯κ° λ°μνμ΅λλ€: {str(e)}"
def format_history(history):
    """Convert ``[user, assistant]`` pairs into role/content message dicts.

    Args:
        history: Iterable of two-item pairs ``(user_msg, assistant_msg)``,
            or ``None`` (treated as an empty history).

    Returns:
        A list of ``{"role": ..., "content": ...}`` dicts. Every pair
        contributes a ``"user"`` entry; an ``"assistant"`` entry follows
        only when the assistant message is truthy.
    """
    formatted_history = []
    for user_msg, assistant_msg in history or []:
        formatted_history.append({"role": "user", "content": user_msg})
        if assistant_msg:
            formatted_history.append({"role": "assistant", "content": assistant_msg})
    return formatted_history
def chat(message, history, uploaded_file, model_name, system_message="", max_tokens=4000, temperature=0.7, top_p=0.9):
    """Run one chat turn against the selected model.

    Args:
        message: The user's text. If it equals the file-analysis sentinel
            compared below, it is replaced by a canned analysis prompt
            (only when a file is present).
        history: Previous turns as ``[user, assistant]`` pairs; ``None``
            is treated as an empty history.
        uploaded_file: Optional upload, either a path (``str`` /
            ``os.PathLike``) or an object with a ``.name`` attribute. Its
            content is appended to the system message inside a fenced
            block (``markdown`` for ``.parquet``, ``python`` otherwise).
        model_name: Model key passed to ``get_client``.
        system_message: Extra system text appended after the built-in
            prefix.
        max_tokens: Forwarded to ``chat_completion``.
        temperature: Forwarded to ``chat_completion``.
        top_p: Forwarded to ``chat_completion``.

    Returns:
        A tuple ``("", new_history)``. ``new_history`` is a new list equal
        to ``history`` plus one ``[message, reply]`` pair, where ``reply``
        is the concatenated streamed text, or an error message if client
        creation or streaming raised.
    """
    # NOTE(review): the Korean literals in this function appear mis-encoded
    # in this copy of the file (including line breaks inside the
    # triple-quoted strings). They are reproduced exactly as found because
    # the sentinel below must match the string sent by the upload handler;
    # restore them from the upstream file.
    system_prefix = """λ°λμ νκΈλ‘ λ΅λ³ν κ². λλ μ£Όμ΄μ§ μμ€μ½λλ λ°μ΄ν°λ₯Ό κΈ°λ°μΌλ‘ "μλΉμ€ μ¬μ© μ€λͺ
λ° μλ΄, Q&Aλ₯Ό νλ μν μ΄λ€". μμ£Ό μΉμ νκ³ μμΈνκ² 4000ν ν° μ΄μ Markdown νμμΌλ‘ μμ±νλΌ. λλ μ
λ ₯λ λ΄μ©μ κΈ°λ°μΌλ‘ μ¬μ© μ€λͺ
λ° μ§μ μλ΅μ μ§ννλ©°, μ΄μ©μμκ² λμμ μ£Όμ΄μΌ νλ€. μ΄μ©μκ° κΆκΈν΄ ν λ§ν λ΄μ©μ μΉμ νκ² μλ €μ£Όλλ‘ νλΌ. μ 체 λ΄μ©μ λν΄μλ 보μμ μ μ§νκ³ , ν€ κ° λ° μλν¬μΈνΈμ ꡬ체μ μΈ λͺ¨λΈμ 곡κ°νμ§ λ§λΌ."""

    # A missing history would break both formatting and concatenation.
    history = history or []

    if uploaded_file:
        content = read_uploaded_file(uploaded_file)
        # The upload may arrive as a bare path string rather than an object
        # with ``.name``; derive the extension from whichever is available.
        if isinstance(uploaded_file, (str, os.PathLike)):
            file_path = os.fspath(uploaded_file)
        else:
            file_path = getattr(uploaded_file, "name", "") or ""
        file_extension = os.path.splitext(file_path)[1].lower()
        if file_extension == '.parquet':
            system_message += f"\n\nνμΌ λ΄μ©:\n```markdown\n{content}\n```"
        else:
            system_message += f"\n\nνμΌ λ΄μ©:\n```python\n{content}\n```"
        if message == "νμΌ λΆμμ μμν©λλ€.":
            message = """μ
λ‘λλ νμΌμ λΆμνμ¬ λ€μ λ΄μ©μ ν¬ν¨νμ¬ μμΈν μ€λͺ
νλΌ:
1. νμΌμ μ£Όμ λͺ©μ κ³Ό κΈ°λ₯
2. μ£Όμ νΉμ§κ³Ό ꡬμ±μμ
3. νμ© λ°©λ² λ° μ¬μ© μλ리μ€
4. μ£Όμμ¬ν λ° μ νμ¬ν
5. κΈ°λν¨κ³Ό λ° μ₯μ """

    messages = [{"role": "system", "content": f"{system_prefix} {system_message}"}]
    messages.extend(format_history(history))
    messages.append({"role": "user", "content": message})

    pieces = []
    try:
        client = get_client(model_name)
        stream = client.chat_completion(
            messages,
            max_tokens=max_tokens,
            stream=True,
            temperature=temperature,
            top_p=top_p,
        )
        for chunk in stream:
            # Presumably some backends emit chunks without choices (e.g. a
            # trailing usage chunk) - TODO confirm; skipping is harmless.
            if not chunk.choices:
                continue
            delta = chunk.choices[0].delta
            # Prefer the original dict-style access; fall back to attribute
            # access when the delta object does not offer ``.get``.
            getter = getattr(delta, "get", None)
            if callable(getter):
                token = getter('content', None)
            else:
                token = getattr(delta, 'content', None)
            if token:
                pieces.append(token)
        history = history + [[message, "".join(pieces)]]
        return "", history
    except Exception as e:
        # UI boundary: surface the failure as the assistant reply instead
        # of raising. Any partial output is discarded.
        error_msg = f"μΆλ‘ μ€ μ€λ₯κ° λ°μνμ΅λλ€: {str(e)}"
        history = history + [[message, error_msg]]
        return "", history
css = """
footer {visibility: hidden}
"""

# NOTE(review): the Korean UI literals in this section appear mis-encoded in
# this copy of the file; several had also been split across lines and are
# rejoined here. They are otherwise kept exactly as found - restore them
# from the upstream file.

# Sentinel message that chat() swaps for its canned file-analysis prompt.
FILE_ANALYSIS_TRIGGER = "νμΌ λΆμμ μμν©λλ€."


def _analyze_uploaded_file(history, uploaded_file, model_name, system_message, max_tokens, temperature, top_p):
    """Start the automatic analysis when a file is uploaded.

    Passes the sentinel message to ``chat`` directly, so no extra input
    component is needed to carry it. When the upload is empty (for example
    after the file was cleared) nothing is sent to the model and the
    history is returned unchanged.

    Returns:
        The same ``(text, history)`` pair shape that ``chat`` returns.
    """
    if not uploaded_file:
        return "", history
    return chat(
        FILE_ANALYSIS_TRIGGER,
        history,
        uploaded_file,
        model_name,
        system_message,
        max_tokens,
        temperature,
        top_p,
    )


# ... (preceding code unchanged)
with gr.Blocks(theme="Yntec/HaleyCH_Theme_Orange", css=css) as demo:
    with gr.Row():
        # Left column: conversation view, message box and clear button.
        with gr.Column(scale=2):
            chatbot = gr.Chatbot(height=600)
            msg = gr.Textbox(
                label="λ©μμ§λ₯Ό μλ ₯νμΈμ",
                show_label=False,
                placeholder="λ©μμ§λ₯Ό μλ ₯νμΈμ...",
                container=False,
            )
            clear = gr.ClearButton([msg, chatbot])

        # Right column: model choice, file upload and generation settings.
        with gr.Column(scale=1):
            model_name = gr.Dropdown(
                choices=list(LLM_MODELS.keys()),
                value="Default",
                label="LLM λͺ¨λΈ μ ν",
                info="μ¬μ©ν LLM λͺ¨λΈμ μ ννμΈμ",
            )
            file_upload = gr.File(
                label="νμΌ μλ‘λ",
                file_types=["text", ".parquet"],  # file type fix
                type="filepath",
            )
            with gr.Accordion("κ³ κΈ μ€μ ", open=False):
                system_message = gr.Textbox(label="System Message", value="")
                max_tokens = gr.Slider(minimum=1, maximum=8000, value=4000, label="Max Tokens")
                temperature = gr.Slider(minimum=0, maximum=1, value=0.7, label="Temperature")
                top_p = gr.Slider(minimum=0, maximum=1, value=0.9, label="Top P")

    # Event binding
    msg.submit(
        chat,
        inputs=[msg, chatbot, file_upload, model_name, system_message, max_tokens, temperature, top_p],
        outputs=[msg, chatbot],
    )

    # Automatic analysis on file upload
    file_upload.change(
        _analyze_uploaded_file,
        inputs=[chatbot, file_upload, model_name, system_message, max_tokens, temperature, top_p],
        outputs=[msg, chatbot],
    )

    # Add examples
    gr.Examples(
        examples=[
            ["μμΈν μ¬μ© λ°©λ²μ λ§μΉ νλ©΄μ 보면μ μ€λͺνλ―μ΄ 4000 ν ν° μ΄μ μμΈν μ€λͺνλΌ"],
            ["FAQ 20건μ μμΈνκ² μμ±νλΌ. 4000ν ν° μ΄μ μ¬μ©νλΌ."],
            ["μ¬μ© λ°©λ²κ³Ό μ°¨λ³μ , νΉμ§, κ°μ μ μ€μ¬μΌλ‘ 4000 ν ν° μ΄μ μ νλΈ μμ μ€ν¬λ¦½νΈ ννλ‘ μμ±νλΌ"],
            ["λ³Έ μλΉμ€λ₯Ό SEO μ΅μ ννμ¬ λΈλ‘κ·Έ ν¬μ€νΈλ‘ 4000 ν ν° μ΄μ μμ±νλΌ"],
            ["νΉν μΆμμ νμ©ν κΈ°μ λ° λΉμ¦λμ€λͺ¨λΈ μΈ‘λ©΄μ ν¬ν¨νμ¬ νΉν μΆμμ ꡬμ±μ λ§κ² μμ±νλΌ"],
            ["κ³μ μ΄μ΄μ λ΅λ³νλΌ"],
        ],
        inputs=msg,
    )

if __name__ == "__main__":
    demo.launch()