Spaces:

QaillcNextGen
/

phi_faster

Build error

mattritchey committed on Jan 31

Commit

b6f32b8

•

1 Parent(s): c5b6761

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -51,13 +51,13 @@ tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
 quantization_config_loading = GPTQConfig(bits=4, disable_exllama=True) #MR Added
 model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float32, device_map="auto",
                                              trust_remote_code=True,
-                                             quantization_config=quantization_config_loading #MR Added
                                              )
 # sentence transformers to be used in vector store
 embeddings = HuggingFaceEmbeddings(
       model_name="sentence-transformers/all-mpnet-base-v2", #Change MR
-      model_kwargs={'device': 'auto'}, #Change MR
       encode_kwargs={'normalize_embeddings': False}
   )

 quantization_config_loading = GPTQConfig(bits=4, disable_exllama=True) #MR Added
 model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float32, device_map="auto",
                                              trust_remote_code=True,
+                                             # quantization_config=quantization_config_loading #MR Added
                                              )
 # sentence transformers to be used in vector store
 embeddings = HuggingFaceEmbeddings(
       model_name="sentence-transformers/all-mpnet-base-v2", #Change MR
+      model_kwargs={'device': 'cpu'},
       encode_kwargs={'normalize_embeddings': False}
   )