seapoe1809 committed
Commit f90b079 · verified · 1 Parent(s): e98ccdd

Update darnabot.py

Files changed (1)
  1. darnabot.py +6 -5
darnabot.py CHANGED
@@ -72,15 +72,16 @@ import spaces
 MODEL_LIST = ["mistralai/Mistral-Nemo-Instruct-2407"]
 HF_TOKEN = os.environ.get("HF_TOKEN", None)
 MODEL = os.environ.get("MODEL_ID")
-device = "cuda" if torch.cuda.is_available() else "cpu"  # Use GPU if available, otherwise CPU
+
+device = "cuda"
 
 tokenizer = AutoTokenizer.from_pretrained(MODEL)
 model = AutoModelForCausalLM.from_pretrained(
     MODEL,
-    torch_dtype=torch.bfloat16,  # Using bf16 precision
-    device_map="auto",  # Automatically map model to available devices
-    ignore_mismatched_sizes=True  # Allows some flexibility if dimensions don't match
-).to(device)
+    torch_dtype=torch.bfloat16,
+    device_map="auto",
+    ignore_mismatched_sizes=True)
+
 
 async def chat(messages):
     # Convert messages to the format required for the model
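For reference, a minimal sketch of how the updated loading block reads once assembled. The imports and the inline comments below are assumptions filled in for readability, not part of the commit; the commit itself hardcodes device = "cuda", strips the old inline comments, and drops the trailing .to(device) call in favor of device_map="auto".

import os

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

MODEL_LIST = ["mistralai/Mistral-Nemo-Instruct-2407"]
HF_TOKEN = os.environ.get("HF_TOKEN", None)
MODEL = os.environ.get("MODEL_ID")

device = "cuda"  # hardcoded in this commit; the torch.cuda.is_available() fallback was removed

tokenizer = AutoTokenizer.from_pretrained(MODEL)
model = AutoModelForCausalLM.from_pretrained(
    MODEL,
    torch_dtype=torch.bfloat16,    # load weights in bfloat16 precision
    device_map="auto",             # let transformers/accelerate place the model, so no explicit .to(device)
    ignore_mismatched_sizes=True,  # tolerate size mismatches between checkpoint and config
)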