Spaces:
Sleeping
Sleeping
from transformers import AutoTokenizer | |
import transformers | |
import torch | |
from huggingface_hub import login | |
import os | |
login(token = os.getenv('HF_TOKEN')) | |
class Model(torch.nn.Module): | |
number_of_models = 0 | |
__model_list__ = [ | |
"lmsys/vicuna-7b-v1.5", | |
"meta-llama/Meta-Llama-3.1-8B" | |
] | |
def __init__(self, model_name="lmsys/vicuna-7b-v1.5") -> None: | |
super(Model, self).__init__() | |
self.tokenizer = AutoTokenizer.from_pretrained(model_name) | |
self.name = model_name | |
self.pipeline = transformers.pipeline( | |
"text-generation", | |
model=model_name, | |
tokenizer=self.tokenizer, | |
torch_dtype=torch.bfloat16, | |
device_map="auto", | |
) | |
self.update() | |
def update(cls): | |
cls.number_of_models += 1 | |
def return_mode_name(self): | |
return self.name | |
def return_tokenizer(self): | |
return self.tokenizer | |
def return_model(self): | |
return self.pipeline | |
def gen(self, content, temp=0.1, max_length=500): | |
sequences = self.pipeline( | |
content, | |
max_new_tokens=max_length, | |
do_sample=True, | |
temperature=temp, | |
num_return_sequences=1, | |
eos_token_id=self.tokenizer.eos_token_id, | |
return_full_text=False | |
) | |
return sequences[-1]['generated_text'] |