ohmreborn committed on
Commit
10711d5
•
1 Parent(s): 4c3d1f2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -20,7 +20,8 @@ def main(
20
  model = LlamaForCausalLM.from_pretrained(
21
  base_model,
22
  load_in_8bit=load_8bit,
23
- device_map={"": device},
 
24
  low_cpu_mem_usage=True
25
  )
26
  model = PeftModel.from_pretrained(
@@ -28,7 +29,6 @@ def main(
28
  lora_weights,
29
  device_map={"": device},
30
  )
31
- model = model.merge_and_unload()
32
 
33
 
34
  model.config.pad_token_id = tokenizer.pad_token_id = 0
 
20
  model = LlamaForCausalLM.from_pretrained(
21
  base_model,
22
  load_in_8bit=load_8bit,
23
+ max_memory={"cpu":"15GiB"},
24
+ device_map="auto",
25
  low_cpu_mem_usage=True
26
  )
27
  model = PeftModel.from_pretrained(
 
29
  lora_weights,
30
  device_map={"": device},
31
  )
 
32
 
33
 
34
  model.config.pad_token_id = tokenizer.pad_token_id = 0