File size: 12,772 Bytes
5af46fb
 
 
ae70e6a
c33d018
9bfc3b6
c33d018
21856fb
cef6f84
c33d018
 
 
ae70e6a
c33d018
 
 
 
 
 
ae70e6a
c33d018
 
68f7742
c33d018
 
 
 
 
ae70e6a
c33d018
 
 
8d7ca1f
c33d018
 
 
 
 
 
f9bde5f
1824ff5
c33d018
ae70e6a
5af46fb
 
ae70e6a
5af46fb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
ae70e6a
2db3da4
3759f51
ae70e6a
bf88d0f
21c49f2
 
 
 
 
 
f26a575
21c49f2
 
e011fe4
 
 
 
 
 
 
21c49f2
f17637f
b7fdb16
f17637f
 
 
b7fdb16
 
 
 
 
 
f17637f
b7fdb16
 
f17637f
21c49f2
5213f60
21c49f2
ae70e6a
 
5af46fb
4bb75ae
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
import gradio as gr
from huggingface_hub import InferenceClient

# Markdown description
DESCRIPTION = '''
<div>
<h1 style="text-align: center;">zephyr-7b-beta</h1>
<p>This Space demonstrates the instruction-tuned model <b>zephyr-7b-beta by Hugging face</b>. zephyr-7b-beta is the new open 7B parameter GPT-like model fine-tuned on a mix of publicly available, synthetic datasets.<br><i>It can work as a summarizer, sentiment analyzer and Q/A chatbot with multiple other facilities.</i> 
<br>Feel free to play with it, or duplicate to run privately!</p>
</div>
'''

# License markdown
LICENSE = """
<p/>
---
Built with zephyr-7b-beta
"""

# Placeholder HTML
PLACEHOLDER = """
<div style="padding: 30px; text-align: center; display: flex; flex-direction: column; align-items: center;">
   <img src="" style="width: 80%; max-width: 550px; height: auto; opacity: 0.55;  "> 
   <h1 style="font-size: 28px; margin-bottom: 2px; opacity: 0.55;">zephyr-7b-beta</h1>
   <p style="font-size: 18px; margin-bottom: 2px; opacity: 0.65;">Ask me anything...</p>
</div>
"""

# CSS styles
css = """
h1 {
  text-align: center;
  display:block;
}
#duplicate-button {
  margin: auto;
  color: white;
  background: #1565c0;
  border-radius: 100vh;
}
"""

# Initialize InferenceClient
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

# Function to respond to user messages
def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
):
    messages = [{"role": "system", "content": system_message}]

    for val in history:
        if val[0]:
            messages.append({"role": "user", "content": val[0]})
        if val[1]:
            messages.append({"role": "assistant", "content": val[1]})

    messages.append({"role": "user", "content": message})

    response = ""

    for message in client.chat_completion(
        messages,
        max_tokens=max_tokens,
        stream=True,
        temperature=temperature,
        top_p=top_p,
    ):
        token = message.choices[0].delta.content

        response += token
        yield response

# Create a Chatbot
chatbot=gr.Chatbot(height=450, placeholder=PLACEHOLDER, label='Gradio ChatInterface')

# Define the interface layout
with gr.Blocks(fill_height=True,css=css) as demo:
    # Add description markdown
    gr.Markdown(DESCRIPTION)
    # Add duplicate button
    gr.DuplicateButton(value="Duplicate Space for private use", elem_id="duplicate-button")
    # Add chat interface
    gr.ChatInterface(
        fill_height=True,
        fn=respond,
        chatbot=chatbot,
        examples=[
            ['How to setup a human base on Mars? Give short answer.'],
            ['Explain theory of relativity to me like I’m 8 years old.'],
            ['What is 9,000 * 9,000?'],
            ['Write a pun-filled happy birthday message to my friend Alex.'],
            ['Justify why a penguin might make a good king of the jungle.']
        ],
        cache_examples=False,
        additional_inputs_accordion = gr.Accordion(label="⚙️ Parameters", open=False, render= False),
            additional_inputs = [
                gr.Textbox(value="You are a friendly Chatbot.", label="System message",render= False),
                gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens",render= False),
                gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature",render= False),
                gr.Slider(
                    minimum=0.1,
                    maximum=1.0,
                    value=0.95,
                    step=0.05,
                    label="Top-p (nucleus sampling)",
                    render= False
                ),
            ]
        
    )
        # Add license markdown
    gr.Markdown(LICENSE)

# Launch the interface
if __name__ == "__main__":
    demo.launch(share=True)