Krooz committed on
Commit
8e53aab
1 Parent(s): ab4d7cc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -33,12 +33,12 @@ def run_model(report):
33
 
34
  # load base LLM model, LoRA params and tokenizer
35
  model = AutoPeftModelForCausalLM.from_pretrained(
36
- "Krooz/placement-classification-mistral-7b-instruct-v1",
37
  low_cpu_mem_usage=True,
38
  torch_dtype=torch.float16,
39
- load_in_4bit=True
40
  )
41
- tokenizer = AutoTokenizer.from_pretrained("Krooz/placement-classification-mistral-7b-instruct-v1")
42
  input_ids = tokenizer(prompt, return_tensors="pt", truncation=True).input_ids.cpu()
43
 
44
  # inference
 
33
 
34
  # load base LLM model, LoRA params and tokenizer
35
  model = AutoPeftModelForCausalLM.from_pretrained(
36
+ os.getenv("Model_Repo_ID"),
37
  low_cpu_mem_usage=True,
38
  torch_dtype=torch.float16,
39
+ #load_in_4bit=True
40
  )
41
+ tokenizer = AutoTokenizer.from_pretrained(os.getenv("Model_Repo_ID"))
42
  input_ids = tokenizer(prompt, return_tensors="pt", truncation=True).input_ids.cpu()
43
 
44
  # inference