|
import gradio as gr |
|
import cohere |
|
import os |
|
import re |
|
import uuid |
|
import secrets |
|
|
|
|
|
|
|
cohere_api_key = os.getenv("COHERE_API_KEY") |
|
co = cohere.Client(cohere_api_key, client_name="huggingface-aya-23") |
|
|
|
|
|
def trigger_example(example): |
|
chat, updated_history = generate_response(example) |
|
return chat, updated_history |
|
|
|
def generate_response(user_message, cid, token, history=None): |
|
|
|
if not token: |
|
raise gr.Error("Error loading.") |
|
|
|
if history is None: |
|
history = [] |
|
if cid == "" or None: |
|
cid = str(uuid.uuid4()) |
|
|
|
print(f"cid: {cid} prompt:{user_message}") |
|
|
|
history.append(user_message) |
|
|
|
stream = co.chat_stream(message=user_message, conversation_id=cid, model='c4ai-aya-23', connectors=[], temperature=0.3) |
|
|
|
output = "" |
|
|
|
for idx, response in enumerate(stream): |
|
if response.event_type == "text-generation": |
|
output += response.text |
|
if idx == 0: |
|
history.append(" " + output) |
|
else: |
|
history[-1] = output |
|
chat = [ |
|
(history[i].strip(), history[i + 1].strip()) |
|
for i in range(0, len(history) - 1, 2) |
|
] |
|
yield chat, history, cid |
|
|
|
return chat, history, cid |
|
|
|
|
|
def clear_chat(): |
|
return [], [], str(uuid.uuid4()) |
|
|
|
|
|
examples = [ |
|
"Explain the relativity theory in French", |
|
"Como sair de um helicóptero que caiu na água?", |
|
"¿Cómo le explicarías el aprendizaje automático a un extraterrestre?", |
|
"Explain gravity to a chicken.", |
|
"Descrivi il processo di creazione di un capolavoro, come se fossi un artista del Rinascimento a Firenze.", |
|
"Anneme onu ne kadar sevdiğimi anlatan bir mektup yaz", |
|
"Explique-moi le sens de la vie selon un grand auteur littéraire.", |
|
"Give me an example of an endangered species and let me know what I can do to help preserve it", |
|
"یک پاراگراف در مورد زیباییهای طبیعت در فصل پاییز بنویس", |
|
"Wie kann ich lernen, selbstbewusster zu werden?", |
|
"Formally introduce the transformer architecture with notation.", |
|
] |
|
|
|
custom_css = """ |
|
#logo-img { |
|
border: none !important; |
|
} |
|
#chat-message { |
|
font-size: 14px; |
|
min-height: 300px; |
|
} |
|
""" |
|
|
|
with gr.Blocks(analytics_enabled=False, css=custom_css) as demo: |
|
cid = gr.State("") |
|
token = gr.State(value=None) |
|
|
|
with gr.Row(): |
|
with gr.Column(scale=1): |
|
gr.Image("aya-logo.png", elem_id="logo-img", show_label=False, show_share_button=False, show_download_button=False) |
|
with gr.Column(scale=3): |
|
gr.Markdown("""C4AI Aya 23 is a research open weights release of an 8 and 35 billion parameter with highly advanced instruction fine-tuned model, covering 23 languages: Arabic, Chinese (simplified & traditional), Czech, Dutch, English, French, German, Greek, Hebrew, Hindi, Indonesian, Italian, Japanese, Korean, Persian, Polish, Portuguese, Romanian, Russian, Spanish, Turkish, Ukrainian, and Vietnamese. |
|
<br/> |
|
**Note**: Aya 23 is a single-turn instruction-following model and it is not optimized for chat mode use. |
|
<br/> |
|
**Model**: [aya-23-35B](https://huggingface.co/CohereForAI/aya-23-35B) |
|
<br/> |
|
**Developed by**: [Cohere for AI](https://cohere.com/research) and [Cohere](https://cohere.com/) |
|
<br/> |
|
**License**: [CC-BY-NC](https://cohere.com/c4ai-cc-by-nc-license), requires also adhering to [C4AI's Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy) |
|
""" |
|
) |
|
|
|
with gr.Column(): |
|
with gr.Row(): |
|
chatbot = gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True) |
|
|
|
with gr.Row(): |
|
user_message = gr.Textbox(lines=1, placeholder="Ask anything ...", label="Input", show_label=False) |
|
|
|
|
|
with gr.Row(): |
|
submit_button = gr.Button("Submit") |
|
clear_button = gr.Button("Clear chat") |
|
|
|
|
|
history = gr.State([]) |
|
|
|
user_message.submit(fn=generate_response, inputs=[user_message, cid, token, history], outputs=[chatbot, history, cid], concurrency_limit=32) |
|
submit_button.click(fn=generate_response, inputs=[user_message, cid, token, history], outputs=[chatbot, history, cid], concurrency_limit=32) |
|
|
|
clear_button.click(fn=clear_chat, inputs=None, outputs=[chatbot, history, cid], concurrency_limit=32) |
|
|
|
user_message.submit(lambda x: gr.update(value=""), None, [user_message], queue=False) |
|
submit_button.click(lambda x: gr.update(value=""), None, [user_message], queue=False) |
|
clear_button.click(lambda x: gr.update(value=""), None, [user_message], queue=False) |
|
|
|
with gr.Row(): |
|
gr.Examples( |
|
examples=examples, |
|
inputs=user_message, |
|
cache_examples=False, |
|
fn=trigger_example, |
|
outputs=[chatbot], |
|
examples_per_page=100 |
|
) |
|
|
|
demo.load(lambda: secrets.token_hex(16), None, token) |
|
|
|
if __name__ == "__main__": |
|
|
|
try: |
|
demo.queue(api_open=False, max_size=40).launch(show_api=False) |
|
except Exception as e: |
|
print(f"Error: {e}") |