minhdang committed on
Commit
efa875e
1 Parent(s): 5834081

Update inference.py

Browse files
Files changed (1) hide show
  1. inference.py +1 -1
inference.py CHANGED
@@ -36,7 +36,7 @@ from deepseek_vl.utils.conversation import Conversation
36
  from transformers import BitsAndBytesConfig
37
  from transformers import QuantoConfig
38
 
39
- quanto_config = QuantoConfig(weights="int8")
40
 
41
  def load_model(model_path):
42
  vl_chat_processor: VLChatProcessor = VLChatProcessor.from_pretrained(model_path)
 
36
  from transformers import BitsAndBytesConfig
37
  from transformers import QuantoConfig
38
 
39
+ quanto_config = QuantoConfig(weights="int4")
40
 
41
  def load_model(model_path):
42
  vl_chat_processor: VLChatProcessor = VLChatProcessor.from_pretrained(model_path)