File size: 712 Bytes
fb5ea16
23f4335
278e84d
253248f
a300d2e
9b1724f
a300d2e
c11983f
 
a300d2e
 
 
 
 
 
 
 
aa8d870
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
import os 
import gradio as gr
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM 

# Set CURL_CA_BUNDLE to an empty string before anything is fetched from the Hub.
# NOTE(review): presumably a workaround for TLS certificate errors in the
# hosting environment; this may weaken certificate verification -- confirm.
os.environ["CURL_CA_BUNDLE"] = ""

# Single source of truth for the checkpoint used by both tokenizer and model.
_CHECKPOINT = "togethercomputer/GPT-JT-6B-v0"

# force_download=True asks for the tokenizer files to be fetched again instead
# of reusing a cached copy; local_files_only=False permits network access.
tokenizer = AutoTokenizer.from_pretrained(
    _CHECKPOINT,
    force_download=True,
    local_files_only=False,
)

# Weights are requested in bfloat16.
model = AutoModelForCausalLM.from_pretrained(
    _CHECKPOINT,
    torch_dtype=torch.bfloat16,
)

def gpt(prompt):
    """Generate a short sampled reply to *prompt* with the module-level model.

    The user's text is wrapped in the ``<human>: ...\\n<bot>:`` template,
    tokenized, moved to the model's device, and passed to ``model.generate``
    with sampling enabled (temperature 0.8, at most 10 new tokens).

    Args:
        prompt: Text entered by the user in the Gradio textbox.

    Returns:
        The decoded text of the first sequence returned by ``generate``.
        NOTE(review): for causal LMs this normally contains the templated
        prompt followed by the continuation -- confirm if only the reply
        should be shown.
    """
    # Previously the literal "Hello!" was hard-coded here and `prompt` was
    # ignored, so every request produced a reply to the same greeting.
    templated = f"<human>: {prompt}\n<bot>:"
    inputs = tokenizer(templated, return_tensors='pt').to(model.device)
    outputs = model.generate(**inputs, max_new_tokens=10, do_sample=True, temperature=0.8)
    output_str = tokenizer.decode(outputs[0])
    # Echo to stdout so the generation also shows up in the process logs.
    print(output_str)
    return output_str

# Wrap `gpt` in a text-in / text-out Gradio interface, then start serving it.
demo = gr.Interface(fn=gpt, inputs="text", outputs="text")
demo.launch()