Spaces:

wgetdd
/

QLORA-Phi2

Sleeping

App Files Files Community

wgetdd committed on Dec 21, 2023

Commit

321de10

•

1 Parent(s): 3814244

inference code

Browse files

Files changed (3) hide show

app.py +67 -0
inference.py +28 -0
requirments.txt +8 -0

app.py ADDED Viewed

	@@ -0,0 +1,67 @@

+import gradio as gr
+from torchvision import transforms
+import torch
+from inference import run_inference
+# Markdown help text; it is rendered with gr.Markdown inside the button column
+# of the layout below.
+# NOTE(review): the wording describes a zero-shot MNIST/CIFAR10 demo, while the
+# only tab in this app is "chat_with_phi2" -- looks like leftover copy from
+# another project; confirm and reword.
+description_zero_shot_training = """ ### Zero Shot Training
+                1. Choose a Dataset MNIST/CIFAR10
+                2. Output will be class accuracy
+              """
+# HTML heading shown at the top of the page.
+# NOTE(review): the heading mentions CLIP although the app chats with Phi-2 --
+# presumably copied from an earlier demo; confirm.
+title = "<center><strong><font size='8'>📎 THE CLIP PLAYGROUND 📎</font></strong></center>"
+# Text boxes are created up front and placed into the layout later through
+# their .render() calls: text_input takes the prompt, text_input2 shows the output.
+text_input = gr.Text(label="Enter text")
+text_input2 = gr.Text(label="Generated Response")
+# Custom stylesheet handed to gr.Blocks(css=...).
+css = "h1 { text-align: center } .about { text-align: justify; padding-left: 10%; padding-right: 10%; }"
+with gr.Blocks(css=css, title='Play with CLIP') as demo:
+    with gr.Row():
+        with gr.Column(scale=1):
+            # Title
+            gr.Markdown(title)
+    with gr.Tab("chat_with_phi2"):
+        # Images
+        with gr.Row(variant="panel"):
+            with gr.Column(scale=1):
+                text_input.render()
+            with gr.Column(scale=1):
+                text_input2.render()
+        # Submit & Clear
+        with gr.Row():
+            with gr.Column():
+                run_chat_with_phi2_button = gr.Button("chat_with_phi2", variant='primary')
+                clear_btn_text_to_image = gr.Button("Clear", variant="secondary")
+                gr.Markdown(description_zero_shot_training)
+                gr.Examples(examples = ["What is Large Language models ?", "Can you write a short introduction about the relevance of the term monopsony in economics? Please use examples related to potential monopsonies in the labour market and cite relevant research.", "I want to start doing astrophotography as a hobby, any suggestions what could i do?"],
+                            inputs=[text_input],
+                            outputs=text_input2,
+                            fn=run_inference,
+                            cache_examples=True,
+                            examples_per_page=4)
+    run_chat_with_phi2_button.click(run_inference,
+                        inputs=[
+                            text_input,
+                        ],
+                        outputs=text_input2)
+    #######################################################################################################################
+    def clear():
+        return None, None
+    def clear_text():
+        return None, None, None
+    clear_btn_text_to_image.click(clear, outputs=[text_input, text_input2])
+demo.queue()
+demo.launch()

inference.py ADDED Viewed

	@@ -0,0 +1,28 @@

+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, AutoTokenizer,pipeline
+model_name = "trained_model/content/results/checkpoint-500"
+bnb_config = BitsAndBytesConfig(
+    load_in_4bit=True,
+    bnb_4bit_quant_type="nf4",
+    bnb_4bit_compute_dtype=torch.float16,
+)
+model = AutoModelForCausalLM.from_pretrained(
+    model_name,
+    quantization_config=bnb_config,
+    trust_remote_code=True
+)
+model.config.use_cache = False
+tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
+tokenizer.pad_token = tokenizer.eos_token
+# Run text generation pipeline with our next model
+pipe = pipeline(task="text-generation", model=model, tokenizer=tokenizer, max_length=200)
+def run_inference(prompt):
+    result = pipe(f"<s>[INST] {prompt} [/INST]")
+    return result[0]['generated_text']

requirments.txt ADDED Viewed

	@@ -0,0 +1,8 @@

+trl
+transformers
+accelerate
+git+https://github.com/huggingface/peft.git
+datasets
+bitsandbytes
+einops
+wandb