Spaces: Running on Zero
srijaydeshpande committed
Commit 127c875
1 Parent(s): 72540c8
Update
app.py CHANGED

@@ -4,13 +4,13 @@ from tqdm import tqdm
 import re
 import gradio as gr
 import os
-
+from llama_cpp import Llama
 # from gpt4all import GPT4All
 import transformers
 # from transformers import GemmaTokenizer, AutoModelForCausalLM
 # from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
-import accelerate
-import torch
+import accelerate
+import torch
 
 # HF_TOKEN = os.environ.get("HF_TOKEN", None)
 
@@ -73,49 +73,49 @@ def deidentify_doc(pdftext=""):
 
     prompt = "Please anonymize the following clinical note. Replace all the following information with the term '[redacted]': Redact any strings that might be a name or initials, patients’ names, doctors’ names, the names Dr., redact any medical staff names, redact any strings that might be a location or address, such as '3970 Longview Drive', redact any strings that look like 'age 37', redact any dates and registration numbers, redact professions such as 'manager', redact any contact information."
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+    print('Input prompt is ',prompt)
+    print('Input pdf text is ',pdftext)
+
+    output = model.create_chat_completion(
+        messages = [
+            {"role": "assistant", "content": prompt},
+            {
+                "role": "user",
+                "content": pdftext
+            }
+        ],
+        max_tokens=600,
+        temperature=0
+    )
+    output = output['choices'][0]['message']['content']
 
     # if (pdftext):
     #     prompt = prompt + ': ' + pdftext
     #     output = model.generate(prompt=prompt, max_tokens=1024, n_batch=128)
 
-    messages = [
-        {"role": "assistant",
-         "content": prompt},
-        {"role": "user",
-         "content": pdftext}, ]
-    prompt = model.tokenizer.apply_chat_template(
-        messages,
-        tokenize=False,
-        add_generation_prompt=True
-    )
-    terminators = [
-        model.tokenizer.eos_token_id,
-        model.tokenizer.convert_tokens_to_ids("<|eot_id|>")
-    ]
-    outputs = model(
-        prompt,
-        max_new_tokens=1024,
-        eos_token_id=terminators,
-        do_sample=True,
-        temperature=0.3,
-        top_p=0.95,
-    )
-    output = outputs[0]["generated_text"][len(prompt):]
+    # messages = [
+    #     {"role": "assistant",
+    #      "content": prompt},
+    #     {"role": "user",
+    #      "content": pdftext}, ]
+    # prompt = model.tokenizer.apply_chat_template(
+    #     messages,
+    #     tokenize=False,
+    #     add_generation_prompt=True
+    # )
+    # terminators = [
+    #     model.tokenizer.eos_token_id,
+    #     model.tokenizer.convert_tokens_to_ids("<|eot_id|>")
+    # ]
+    # outputs = model(
+    #     prompt,
+    #     max_new_tokens=1024,
+    #     eos_token_id=terminators,
+    #     do_sample=True,
+    #     temperature=0.3,
+    #     top_p=0.95,
+    # )
+    # output = outputs[0]["generated_text"][len(prompt):]
 
     return output
 
@@ -130,19 +130,19 @@ def pdf_to_text(file):
         file.write(html)
     return html
 
-
-
+model_id = "Meta-Llama-3-8B-Instruct.Q5_K_M.gguf"
+model = Llama(model_path=model_id, n_ctx=2048, n_threads=8, n_gpu_layers=-1, n_batch=64)
 
 # model = GPT4All("Meta-Llama-3-8B-Instruct.Q4_0.gguf", n_threads=8, device='gpu')
 # model.chat_session()
 
-model_id = "Meta-Llama-3-8B-Instruct"
-model = transformers.pipeline(
-    "text-generation",
-    model=model_id,
-    model_kwargs={"torch_dtype": torch.bfloat16},
-    device="cpu",
-)
+# model_id = "D:/llama/meta-llama/Meta-Llama-3-8B-Instruct"
+# model = transformers.pipeline(
+#     "text-generation",
+#     model=model_id,
+#     model_kwargs={"torch_dtype": torch.bfloat16},
+#     device="cpu",
+# )
 
 css = ".gradio-container {background: 'logo.png'}"
 
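In short, this commit swaps the commented-out transformers text-generation pipeline for llama-cpp-python serving a quantized GGUF build of Meta-Llama-3-8B-Instruct. A minimal sketch of the resulting inference path, assuming the Meta-Llama-3-8B-Instruct.Q5_K_M.gguf weights file sits in the working directory (the weights are not part of this commit, and the sample note below is invented for illustration):

from llama_cpp import Llama

# Same constructor arguments as the commit: 2048-token context window,
# 8 CPU threads, all layers offloaded to the GPU if one is present
# (n_gpu_layers=-1), prompt processing in batches of 64 tokens.
model = Llama(
    model_path="Meta-Llama-3-8B-Instruct.Q5_K_M.gguf",
    n_ctx=2048,
    n_threads=8,
    n_gpu_layers=-1,
    n_batch=64,
)

# The redaction instructions from deidentify_doc(), truncated here for brevity.
prompt = "Please anonymize the following clinical note. Replace all the following information with the term '[redacted]': ..."
# Invented stand-in for the text extracted from an uploaded PDF.
pdftext = "Patient John Smith, age 37, was seen by Dr. Jones at 3970 Longview Drive."

# Mirrors the new deidentify_doc() body: the instructions travel in one turn,
# the document text in the user turn; temperature=0 keeps redaction deterministic.
output = model.create_chat_completion(
    messages=[
        {"role": "assistant", "content": prompt},
        {"role": "user", "content": pdftext},
    ],
    max_tokens=600,
    temperature=0,
)
print(output['choices'][0]['message']['content'])

One detail worth noting: the instructions are sent in an "assistant" turn rather than the more conventional "system" turn. The Llama 3 chat template appears to accept either role, but a system role would state the intent more directly.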