nikravan committed on
Commit
148c35f
1 Parent(s): 4aeaa92

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -39,10 +39,11 @@ quantization_config = BitsAndBytesConfig(
39
 
40
  model = AutoModelForCausalLM.from_pretrained(
41
  MODEL_ID,
42
-
 
43
  low_cpu_mem_usage=True,
44
  trust_remote_code=True,
45
- return_dict=True,
46
  quantization_config=quantization_config
47
  )
48
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
 
39
 
40
  model = AutoModelForCausalLM.from_pretrained(
41
  MODEL_ID,
42
+ torch_dtype=inference_dtype,
43
+ device_map = "cuda:0",
44
  low_cpu_mem_usage=True,
45
  trust_remote_code=True,
46
+
47
  quantization_config=quantization_config
48
  )
49
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)