mattritchey committed on
Commit
b6f32b8
1 Parent(s): c5b6761

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -51,13 +51,13 @@ tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
51
  quantization_config_loading = GPTQConfig(bits=4, disable_exllama=True) #MR Added
52
  model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float32, device_map="auto",
53
  trust_remote_code=True,
54
- quantization_config=quantization_config_loading #MR Added
55
  )
56
 
57
  # sentence transformers to be used in vector store
58
  embeddings = HuggingFaceEmbeddings(
59
  model_name="sentence-transformers/all-mpnet-base-v2", #Change MR
60
- model_kwargs={'device': 'auto'}, #Change MR
61
  encode_kwargs={'normalize_embeddings': False}
62
  )
63
 
 
51
  quantization_config_loading = GPTQConfig(bits=4, disable_exllama=True) #MR Added
52
  model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float32, device_map="auto",
53
  trust_remote_code=True,
54
+ # quantization_config=quantization_config_loading #MR Added
55
  )
56
 
57
  # sentence transformers to be used in vector store
58
  embeddings = HuggingFaceEmbeddings(
59
  model_name="sentence-transformers/all-mpnet-base-v2", #Change MR
60
+ model_kwargs={'device': 'cpu'},
61
  encode_kwargs={'normalize_embeddings': False}
62
  )
63