Update app.py
app.py CHANGED
@@ -4,19 +4,23 @@ from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
 import random
 
-model_path = hf_hub_download(
-    repo_id="AstroMLab/AstroSage-8B-GGUF",
-    filename="AstroSage-8B-Q8_0.gguf"
-)
-
+@spaces.GPU
+def initialize_model():
+    model_path = hf_hub_download(
+        repo_id="AstroMLab/AstroSage-8B-GGUF",
+        filename="AstroSage-8B-Q8_0.gguf"
+    )
+
+    llm = Llama(
+        model_path=model_path,
+        n_ctx=2048,
+        chat_format="llama-3",
+        n_gpu_layers=-1, # ensure all layers are on GPU
+        flash_attn=True,
+    )
+    return llm
 
-llm = Llama(
-    model_path=model_path,
-    n_ctx=2048,
-    chat_format="llama-3",
-    n_gpu_layers=-1, # ensure all layers are on GPU
-    flash_attn=True,
-)
+llm = initialize_model()
 
 # Placeholder responses for when context is empty
 GREETING_MESSAGES = [
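For context, a minimal sketch of how the module-level `llm` produced by the new `initialize_model()` might be consumed elsewhere in app.py. The `respond` handler name, system prompt, and sampling parameters below are illustrative assumptions and are not part of this commit; only `initialize_model()` and `llm` come from the diff above, while `create_chat_completion` is the standard llama-cpp-python chat API. The `@spaces.GPU` decorator also assumes `import spaces` is already present near the top of app.py.

# Hypothetical caller using the module-level `llm` created by initialize_model() above.
def respond(user_message: str) -> str:
    result = llm.create_chat_completion(
        messages=[
            # System prompt is a placeholder, not taken from this repo.
            {"role": "system", "content": "You are AstroSage, an astronomy assistant."},
            {"role": "user", "content": user_message},
        ],
        max_tokens=512,
        temperature=0.7,
    )
    # llama-cpp-python returns an OpenAI-style completion dict.
    return result["choices"][0]["message"]["content"]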