Spaces:

Pr123
/

TinyLlama-EA-Chat

Sleeping

Pr123 committed on Apr 1

Commit

dd17305

•

1 Parent(s): 8cbf8ae

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,11 +7,12 @@ import gradio as gr
 peft_model_id = "Pr123/TinyLlama-EA-Chat"
 # Load Model with PEFT adapter
 model = AutoPeftModelForCausalLM.from_pretrained(
     peft_model_id,
-    device_map="auto",
-    torch_dtype=torch.float16
-)
 tokenizer = AutoTokenizer.from_pretrained(peft_model_id)
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, max_length=500)

 peft_model_id = "Pr123/TinyLlama-EA-Chat"
 # Load Model with PEFT adapter
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model = AutoPeftModelForCausalLM.from_pretrained(
     peft_model_id,
+    torch_dtype=torch.float16  # Keeping half precision
+).to(device)
 tokenizer = AutoTokenizer.from_pretrained(peft_model_id)
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, max_length=500)