Spaces:

3B-Group
/

ConvRe-Leaderboard

Sleeping

Trayvon committed on Oct 8, 2023

Commit

66d5e37

•

1 Parent(s): 17976d5

Update src/demo.py

Files changed (1) hide show

src/demo.py CHANGED Viewed

@@ -22,7 +22,7 @@ type2dataset = {
 model_id = "meta-llama/Llama-2-7b-chat-hf"
 tokenizer = AutoTokenizer.from_pretrained(model_id, token=TOKEN)
-model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16, token=TOKEN).eval()
 # type2dataset = {}
@@ -35,7 +35,7 @@ def generate(input_text, sys_prompt) -> str:
 '''
     input_str = sys_prompt + input_text + " [/INST]"
-    input_ids = tokenizer(input_str, return_tensors="pt").input_ids
     outputs = model.generate(input_ids, max_length=512)
     result = tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]

 model_id = "meta-llama/Llama-2-7b-chat-hf"
 tokenizer = AutoTokenizer.from_pretrained(model_id, token=TOKEN)
+model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16, token=TOKEN, device_map="auto").eval()
 # type2dataset = {}
 '''
     input_str = sys_prompt + input_text + " [/INST]"
+    input_ids = tokenizer(input_str, return_tensors="pt").input_ids.to('cuda')
     outputs = model.generate(input_ids, max_length=512)
     result = tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]