# Module setup: standard-library imports, a build-time install of
# llama-cpp-python, third-party imports, and the configuration constants.
import asyncio
import datetime
import json
import os
import random
import re
import subprocess
import sys
from itertools import chain

# llama-cpp-python has to be compiled against OpenBLAS for CPU inference, so
# it is installed here, before `llama_cpp` is imported further down.
# Prebuilt cuBLAS wheels are an alternative:
# https://jllllll.github.io/llama-cpp-python-cuBLAS-wheels/
# `sys.executable -m pip` guarantees the package lands in the interpreter that
# is running this script rather than in whichever `pip` is first on PATH.
_install = subprocess.run(
    [sys.executable, "-m", "pip", "install", "llama-cpp-python==0.2.11"],
    env={
        **os.environ,
        "CMAKE_ARGS": "-DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS",
    },
    check=False,
)
if _install.returncode != 0:
    # Best effort: an already-installed llama-cpp-python may still be
    # importable, so report the failure instead of aborting startup.
    print(
        "WARNING: pip install llama-cpp-python exited with code "
        f"{_install.returncode}",
        file=sys.stderr,
    )

# Third-party imports; `llama_cpp` must stay below the install step above.
import requests
import gradio as gr
import torch
from llama_cpp import Llama
from transformers import (
    StoppingCriteriaList,
    MaxLengthCriteria,
)

# Created by
# https://huggingface.co/gorkemgoknar

# The Coqui V1 API renders the voice; XTTS can be used as well.
# COQUI_URL = "https://app.coqui.ai/api/v2/samples"
COQUI_URL = "https://app.coqui.ai/api/v2/samples/xtts"
COQUI_URL_EN = "https://app.coqui.ai/api/v2/samples/xtts/render/"

# WARNING: each rendered sample consumes credits.
COQUI_TOKEN = os.environ.get("COQUI_TOKEN")

# Falls back to 0 when the variable is unset or empty, instead of failing at
# import time with `TypeError: int() argument must be ... not 'NoneType'`.
# NOTE(review): 0 is presumably the most restrictive voice quota -- confirm
# against the code that compares PER_RUN_COUNTER with this value.
PER_RUN_MAX_VOICE = int(os.environ.get("PER_RUN_MAX_VOICE") or "0")
PER_RUN_COUNTER = 0
RUN_START_HOUR = datetime.datetime.now().hour

MAX_NEW_TOKENS = 30
GPU_LAYERS = 0
STOP_LIST = ["###", "##"]
LLAMA_VERBOSE = False

# FIXME: the TITLE string literal is cut off at this point of the file (only
# its opening quote is present), so the assignment is kept inert here:
# TITLE = "

PER_RUN_MAX_VOICE): gr.Warning("Unfortunately voice limit is reached, try again after another time, or use without voice") WITH_AUDIO=0 else: if with_voice==VOICE_CHOICES[0]: WITH_AUDIO=1 else: WITH_AUDIO=0 return with_voice, WITH_AUDIO with gr.Blocks(css=css) as interface: VOICE_COUNTER=gr.State(value=0) WITH_AUDIO=gr.State(value=1) VOICE_LIMIT=int( os.environ.get("VOICE_LIMIT") ) with gr.Row(): gr.HTML(TITLE, elem_id="banner") gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text") with gr.Row(): drop_char1 = gr.components.Dropdown(CHARACTER_1_CHOICES,label="Character 1",value=CHARACTER_1_CHOICES[0]) drop_char2 = gr.components.Dropdown(CHARACTER_2_CHOICES,label="Character 2",value=CHARACTER_2_CHOICES[1]) run_count = gr.components.Dropdown(RUN_COUNT,label="Line count per character",value="2") with gr.Row(): context_choice = gr.components.Dropdown(CONTEXT_CHOICES, label="Context",value=CONTEXT_CHOICES[0]) with gr.Row(): with_voice = gr.components.Dropdown(VOICE_CHOICES,label="Voice via Coqui.ai (demo)",value=VOICE_CHOICES[0]) with gr.Row(): txt = gr.Textbox( show_label=False, placeholder="Enter text and press enter, or upload an image", value=EXAMPLE_INITIALS[0],elem_classes="user_msg" ) submit_btn = gr.Button(value="Submit") examples = gr.Examples(examples=EXAMPLE_INITIALS, inputs=[txt]) with gr.Row(): with gr.Column(): history = gr.Textbox(lines=25, show_label=True, label="History", placeholder="History", ).style(height=50) with gr.Column(): audio1 = gr.Audio(elem_id="audio1",elem_classes="audio",autoplay=False,visible=False) audio2 = gr.Audio(elem_id="audio2",elem_classes="audio",autoplay=False,visible=False) audio3 = gr.Audio(elem_id="audio3",elem_classes="audio",autoplay=False,visible=False) audio4 = gr.Audio(elem_id="audio4",elem_classes="audio",autoplay=False,visible=False) audio5 = gr.Audio(elem_id="audio5",elem_classes="audio",autoplay=False,visible=False) audio6 = gr.Audio(elem_id="audio6",elem_classes="audio",autoplay=False,visible=False) audio7 = 
gr.Audio(elem_id="audio7",elem_classes="audio",autoplay=False,visible=False) audio8 = gr.Audio(elem_id="audio8",elem_classes="audio",autoplay=False,visible=False) with_voice.change(switch_voice,[with_voice,WITH_AUDIO,VOICE_COUNTER],[with_voice,WITH_AUDIO]) run_count.change(change_run_count,[run_count],[audio1,audio2,audio3,audio4,audio5,audio6,audio7,audio8]) submit_btn.click(add_text, [WITH_AUDIO,drop_char1, drop_char2,run_count, context_choice, txt,history,VOICE_COUNTER], [txt,history,audio1,audio2,audio3,audio4,audio5,audio6,audio7,audio8,VOICE_COUNTER], api_name="chat") interface.queue().launch()