chatbaichuan7B / app.py
gaogao131's picture
Create app.py
08601b5
raw
history blame
749 Bytes
import gradio as gr
from transformers import AutoModelForCausalLM, AutoTokenizer
# Hub id of the checkpoint; shared by the tokenizer and the model so the two
# can never drift apart.
MODEL_ID = "baichuan-inc/baichuan-7B"

# trust_remote_code=True is passed to both loaders, allowing the custom code
# shipped in the checkpoint repository to run.
tokenizer = AutoTokenizer.from_pretrained(
    MODEL_ID,
    trust_remote_code=True,
)
# device_map="auto" leaves weight placement to the library.
model = AutoModelForCausalLM.from_pretrained(
    MODEL_ID,
    device_map="auto",
    trust_remote_code=True,
)
def greet(name):
    """Run the language model on the prompt ``name`` and wrap the output.

    Args:
        name: Prompt text to tokenize and feed to ``model.generate``.

    Returns:
        ``"Hello:: " + <decoded text> + "::!!"``, where the decoded text is
        the first sequence returned by ``model.generate`` with special tokens
        skipped.
    """
    # Example prompt: '登鹳雀楼->王之涣\n夜雨寄北->'
    inputs = tokenizer(name, return_tensors="pt")
    # The model is loaded with device_map="auto", so its device is not known
    # up front. Follow model.device instead of hard-coding 'cuda:0', which
    # fails on hosts without CUDA.
    inputs = inputs.to(model.device)
    # At most 64 new tokens; repetition_penalty=1.1 discourages loops.
    pred = model.generate(**inputs, max_new_tokens=64, repetition_penalty=1.1)
    # Only the first sequence is needed; move it to CPU before decoding.
    result = tokenizer.decode(pred[0].cpu(), skip_special_tokens=True)
    return "Hello:: " + result + "::!!"
# Text-in / text-out web UI around greet().
iface = gr.Interface(
    fn=greet,
    inputs="text",
    outputs="text",
)
# Start serving the interface.
iface.launch()