oleksandrfluxon commited on
Commit
fb80f65
1 Parent(s): d1aa94f

Update pipeline.py

Browse files
Files changed (1) hide show
  1. pipeline.py +1 -1
pipeline.py CHANGED
@@ -26,7 +26,7 @@ class PreTrainedPipeline():
26
  torch_dtype=torch.float16,
27
  trust_remote_code=True,
28
  device_map="auto",
29
- load_in_4bit=True # Load model in the lowest 4-bit precision quantization
30
  )
31
  model.to('cuda')
32
  print("===> model loaded")
 
26
  torch_dtype=torch.float16,
27
  trust_remote_code=True,
28
  device_map="auto",
29
+ load_in_8bit=True # Load model in the lowest 4-bit precision quantization
30
  )
31
  model.to('cuda')
32
  print("===> model loaded")