api-rag-index-chat

Runtime error

Chris4K committed on Feb 3, 2024

Commit

9e6c18e

verified ·

1 Parent(s): b66acba

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,10 +13,16 @@ model_name = "bn22/Mistral-7B-Instruct-v0.1-sharded"
 # function for loading 4-bit quantized model
 def load_quantized_model(model_name: str):
     """
     :param model_name: Name or path of the model to be loaded.
     :return: Loaded quantized model.
-    """
     bnb_config = BitsAndBytesConfig(
         load_in_4bit=True,
         bnb_4bit_use_double_quant=True,
@@ -29,7 +35,7 @@ def load_quantized_model(model_name: str):
         load_in_4bit=True,
         torch_dtype=torch.bfloat16,
         quantization_config=bnb_config
-    )
     return model
 ##################################################

 # function for loading 4-bit quantized model
 def load_quantized_model(model_name: str):
+    model = HuggingFaceHub(
+        repo_id="google/flan-ul2",
+        model_kwargs={"temperature":0.1,
+                      "max_new_tokens":256})
     """
     :param model_name: Name or path of the model to be loaded.
     :return: Loaded quantized model.
     bnb_config = BitsAndBytesConfig(
         load_in_4bit=True,
         bnb_4bit_use_double_quant=True,
         load_in_4bit=True,
         torch_dtype=torch.bfloat16,
         quantization_config=bnb_config
+    )"""
     return model
 ##################################################