Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -33,12 +33,12 @@ def run_model(report):
|
|
33 |
|
34 |
# load base LLM model, LoRA params and tokenizer
|
35 |
model = AutoPeftModelForCausalLM.from_pretrained(
|
36 |
-
"
|
37 |
low_cpu_mem_usage=True,
|
38 |
torch_dtype=torch.float16,
|
39 |
-
load_in_4bit=True
|
40 |
)
|
41 |
-
tokenizer = AutoTokenizer.from_pretrained("
|
42 |
input_ids = tokenizer(prompt, return_tensors="pt", truncation=True).input_ids.cpu()
|
43 |
|
44 |
# inference
|
|
|
33 |
|
34 |
# load base LLM model, LoRA params and tokenizer
|
35 |
model = AutoPeftModelForCausalLM.from_pretrained(
|
36 |
+
os.getenv("Model_Repo_ID"),
|
37 |
low_cpu_mem_usage=True,
|
38 |
torch_dtype=torch.float16,
|
39 |
+
#load_in_4bit=True
|
40 |
)
|
41 |
+
tokenizer = AutoTokenizer.from_pretrained(os.getenv("Model_Repo_ID"))
|
42 |
input_ids = tokenizer(prompt, return_tensors="pt", truncation=True).input_ids.cpu()
|
43 |
|
44 |
# inference
|