dvruette committed on
Commit
6ea89ff
1 Parent(s): cb15a9e

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +4 -1
main.py CHANGED
@@ -5,6 +5,7 @@ from threading import Thread
5
  import time
6
  import torch
7
  import gradio as gr
 
8
  from concept_guidance.chat_template import DEFAULT_CHAT_TEMPLATE
9
  from concept_guidance.patching import patch_model, load_weights
10
  from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline, TextIteratorStreamer, Conversation
@@ -12,8 +13,9 @@ from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline, TextIter
12
  logging.basicConfig(level=logging.INFO)
13
  logger = logging.getLogger(__name__)
14
 
15
- device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
16
  # device = "cpu"
 
17
 
18
  # comment in/out the models you want to use
19
  # RAM requirements: ~16GB x #models (+ ~4GB overhead)
@@ -86,6 +88,7 @@ def add_user_prompt(user_message, history):
86
  history.append([user_message, None])
87
  return history
88
 
 
89
  @torch.no_grad()
90
  def generate_completion(
91
  history,
 
5
  import time
6
  import torch
7
  import gradio as gr
8
+ import spaces
9
  from concept_guidance.chat_template import DEFAULT_CHAT_TEMPLATE
10
  from concept_guidance.patching import patch_model, load_weights
11
  from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline, TextIteratorStreamer, Conversation
 
13
  logging.basicConfig(level=logging.INFO)
14
  logger = logging.getLogger(__name__)
15
 
16
+ # device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
17
  # device = "cpu"
18
+ device = "cuda"
19
 
20
  # comment in/out the models you want to use
21
  # RAM requirements: ~16GB x #models (+ ~4GB overhead)
 
88
  history.append([user_message, None])
89
  return history
90
 
91
+ @spaces.GPU
92
  @torch.no_grad()
93
  def generate_completion(
94
  history,