RAGBOT

Running

Rahatara committed on May 9

Commit

3994ed5

•

1 Parent(s): f361940

Update pdfchatbot.py

Files changed (1) hide show

pdfchatbot.py CHANGED Viewed

@@ -11,13 +11,16 @@ from langchain.document_loaders import PyPDFLoader
 from langchain.prompts import PromptTemplate
 from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
 class PDFChatBot:
     def __init__(self, config_path="config.yaml"):
         """
         Initialize the PDFChatBot instance.
         Parameters:
-            config_path (str): Path to the configuration file (default is "../config.yaml").
         """
         self.processed = False
         self.page = 0
@@ -94,7 +97,10 @@ class PDFChatBot:
         """
         Load the tokenizer from Hugging Face and set in the config file.
         """
-        self.tokenizer = AutoTokenizer.from_pretrained(self.config.get("autoTokenizer"))
     def load_model(self):
         """
@@ -104,7 +110,7 @@ class PDFChatBot:
             self.config.get("autoModelForCausalLM"),
             device_map='auto',
             torch_dtype=torch.float32,
-            token=True,
             load_in_8bit=False
         )
@@ -190,4 +196,4 @@ class PDFChatBot:
         page = doc[self.page]
         pix = page.get_pixmap(matrix=fitz.Matrix(300 / 72, 300 / 72))
         image = Image.frombytes('RGB', [pix.width, pix.height], pix.samples)
-        return image

 from langchain.prompts import PromptTemplate
 from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
+# Store the Hugging Face token in a variable
+HUGGINGFACE_TOKEN = gr.Textbox()
 class PDFChatBot:
     def __init__(self, config_path="config.yaml"):
         """
         Initialize the PDFChatBot instance.
         Parameters:
+            config_path (str): Path to the configuration file (default is "config.yaml").
         """
         self.processed = False
         self.page = 0
         """
         Load the tokenizer from Hugging Face and set in the config file.
         """
+        self.tokenizer = AutoTokenizer.from_pretrained(
+            self.config.get("autoTokenizer"),
+            use_auth_token=HUGGINGFACE_TOKEN
+        )
     def load_model(self):
         """
             self.config.get("autoModelForCausalLM"),
             device_map='auto',
             torch_dtype=torch.float32,
+            use_auth_token=HUGGINGFACE_TOKEN,
             load_in_8bit=False
         )
         page = doc[self.page]
         pix = page.get_pixmap(matrix=fitz.Matrix(300 / 72, 300 / 72))
         image = Image.frombytes('RGB', [pix.width, pix.height], pix.samples)
+        return image