Spaces:

Q4234
/

a1

Runtime error

File size: 1,163 Bytes

b235afa
 
e1b6041
 
711fde0
 
4406c32
b235afa
711fde0
 
 
6a8a445
35d2c47
4406c32
8f108e1
35d2c47
 
8f108e1
 
 
 
 
 
 
4406c32
 
 
6a8a445
4406c32
 
 
 
 
8f108e1
4406c32
8f108e1
4406c32
 
711fde0
 
4406c32
711fde0
 
4406c32
 
 
 
 
b235afa

import gradio as gr

import ctransformers

class Z(object):
    """Format a user instruction into a prompt and run it through a model.

    The model is not created by this class. After construction the caller
    assigns to ``llm`` a callable that accepts the prompt string plus the
    keyword arguments ``max_new_tokens`` and ``temperature``.
    """

    # Instruction-style prompt wrapped around the user's text.
    # For Wizard-Vicuna-13B the prompt format would instead be
    # 'USER: <text>\nASSISTANT:'.
    _PROMPT_TEMPLATE = (
        "Below is an instruction that describes a task. "
        "Write a response that appropriately completes the request.\n"
        "\n"
        "### Instruction:\n"
        "{instruction}\n"
        "\n"
        "### Response:"
    )

    # Generation settings passed to the model on every call.
    _MAX_NEW_TOKENS = 128
    _TEMPERATURE = 0.5  # 0.3 was tried previously

    def __init__(self):
        # Model callable; stays None until the caller assigns one.
        self.llm = None

    def init(self):
        """Do nothing; kept as a hook because callers invoke it after setup."""
        pass

    def greet(self, txt0):
        """Return the model's response to the instruction ``txt0``.

        Args:
            txt0: The user's text; inserted verbatim into the prompt.

        Returns:
            The model output converted to ``str``.

        Raises:
            RuntimeError: If no model has been assigned to ``self.llm``.
        """
        # Use the instance's model rather than a module-level global, so the
        # object works wherever it is created and can be exercised with a stub.
        if self.llm is None:
            raise RuntimeError(
                "No model attached: assign a callable to `llm` before calling greet()."
            )

        # Only the template is parsed by str.format, so braces inside the
        # user's text are inserted literally.
        prompt = self._PROMPT_TEMPLATE.format(instruction=txt0)

        response = self.llm(
            prompt,
            max_new_tokens=self._MAX_NEW_TOKENS,
            temperature=self._TEMPERATURE,
        )
        return str(response)

from ctransformers import AutoModelForCausalLM

# Alternative model: Wizard-Vicuna
# (see https://github.com/melodysdreamj/WizardVicunaLM)
#llm = AutoModelForCausalLM.from_pretrained('TheBloke/Wizard-Vicuna-13B-Uncensored-GGML', model_file='Wizard-Vicuna-13B-Uncensored.ggmlv3.q4_0.bin', model_type='llama')

# Model currently in use. The module-level name `llm` must stay defined
# because code elsewhere in this file refers to it.
llm = AutoModelForCausalLM.from_pretrained(
    'mverrilli/dolly-v2-12b-ggml',
    model_file='ggml-model-q5_0.bin',
    model_type='dolly',
)

# Shared handler instance: attach the loaded model, then run its init hook.
z = Z()
z.llm = llm
z.init()

def greet(arg0: str) -> str:
    """Forward the submitted text to the shared ``z`` instance.

    Args:
        arg0: Text to pass to ``z.greet``.

    Returns:
        Whatever ``z.greet`` returns for ``arg0``.
    """
    # `z` is only read here, never rebound, so no `global` declaration is needed.
    return z.greet(arg0)

# Text-in / text-out web UI whose handler is the module-level `greet`.
iface = gr.Interface(
    fn=greet,
    inputs="text",
    outputs="text",
)

# Start serving the interface.
iface.launch()