Update app.py
app.py CHANGED
@@ -1,4 +1,47 @@
 import gradio as gr
+import os
+import torch
+from transformers import (
+    AutoModelForCausalLM,
+    AutoTokenizer,
+    BitsAndBytesConfig,
+    HfArgumentParser,
+    TrainingArguments,
+    pipeline,
+    logging,
+)
+
+
+################################################################################
+# bitsandbytes parameters
+################################################################################
+
+# Activate 4-bit precision base model loading
+use_4bit = True
+
+# Compute dtype for 4-bit base models
+bnb_4bit_compute_dtype = "float16"
+
+# Quantization type (fp4 or nf4)
+bnb_4bit_quant_type = "nf4"
+
+# Activate nested quantization for 4-bit base models (double quantization)
+use_nested_quant = False
+
+
+################################################################################
+# SFT parameters
+################################################################################
+
+# Maximum sequence length to use
+max_seq_length = None
+
+# Pack multiple short examples in the same input sequence to increase efficiency
+packing = False
+
+# Load the entire model on GPU 0
+device_map = {"": 0}
+
 from transformers import pipeline
 
 # Initialize the pipeline with the LLaMA model