Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -74,7 +74,7 @@ def predict(message, history, system_prompt, temperature, max_new_tokens, top_k,
|
|
74 |
# Load model
|
75 |
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
|
76 |
quantization_config = BitsAndBytesConfig(
|
77 |
-
load_in_4bit=True,
|
78 |
bnb_4bit_compute_dtype=torch.bfloat16
|
79 |
)
|
80 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
@@ -91,12 +91,9 @@ gr.ChatInterface(
|
|
91 |
title=EMOJI + " " + MODEL_NAME,
|
92 |
description=DESCRIPTION,
|
93 |
examples=[
|
94 |
-
["
|
95 |
-
["
|
96 |
-
["
|
97 |
-
["Use a list comprehension to create a list of squares for numbers from 1 to 10."],
|
98 |
-
["Recommend some popular science fiction books."],
|
99 |
-
["Can you write a short story about a time-traveling detective?"]
|
100 |
],
|
101 |
additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False),
|
102 |
additional_inputs=[
|
|
|
74 |
# Load model
|
75 |
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
|
76 |
quantization_config = BitsAndBytesConfig(
|
77 |
+
load_in_4bit=False,
|
78 |
bnb_4bit_compute_dtype=torch.bfloat16
|
79 |
)
|
80 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
|
|
91 |
title=EMOJI + " " + MODEL_NAME,
|
92 |
description=DESCRIPTION,
|
93 |
examples=[
|
94 |
+
["Express joy and excitement about visiting a new place."],
|
95 |
+
["I'm feeling really down today. Nothing seems to be going right."],
|
96 |
+
["hey, How are you and what is your name?"],
|
|
|
|
|
|
|
97 |
],
|
98 |
additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False),
|
99 |
additional_inputs=[
|