Spaces:
Running
on
Zero
Running
on
Zero
Add `spaces` import and `@spaces.GPU` decorator for ZeroGPU support
Browse files
app.py
CHANGED
@@ -3,7 +3,7 @@ import torch
|
|
3 |
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
|
4 |
import json
|
5 |
from globe import title, description, customtool
|
6 |
-
|
7 |
|
8 |
model_path = "nvidia/Nemotron-Mini-4B-Instruct"
|
9 |
tokenizer = AutoTokenizer.from_pretrained(model_path)
|
@@ -32,6 +32,7 @@ The current date is 2023-06-01.
|
|
32 |
else:
|
33 |
return f"<extra_id_0>System\n{system_message}\n\n<extra_id_1>User\n{user_message}\n<extra_id_1>Assistant\n"
|
34 |
|
|
|
35 |
def generate_response(message, history, system_message, max_tokens, temperature, top_p, use_pipeline=False, tool_definition=""):
|
36 |
full_prompt = create_prompt(system_message, message, tool_definition)
|
37 |
|
|
|
3 |
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
|
4 |
import json
|
5 |
from globe import title, description, customtool
|
6 |
+
import spaces
|
7 |
|
8 |
model_path = "nvidia/Nemotron-Mini-4B-Instruct"
|
9 |
tokenizer = AutoTokenizer.from_pretrained(model_path)
|
|
|
32 |
else:
|
33 |
return f"<extra_id_0>System\n{system_message}\n\n<extra_id_1>User\n{user_message}\n<extra_id_1>Assistant\n"
|
34 |
|
35 |
+
@spaces.GPU
|
36 |
def generate_response(message, history, system_message, max_tokens, temperature, top_p, use_pipeline=False, tool_definition=""):
|
37 |
full_prompt = create_prompt(system_message, message, tool_definition)
|
38 |
|