Spaces:

AstroMLab
/

AstroSage

Running on Zero

Tijmen2 committed on Nov 20, 2024

Commit

37d0929

verified ·

1 Parent(s): 7320ca6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,17 +9,13 @@ model_path = hf_hub_download(
     filename="AstroSage-8B-Q8_0.gguf"
 )
-@spaces.GPU(duration=119)
-def load_llm():
-    llm = Llama(
-        model_path=model_path,
-        n_ctx=2048,
-        chat_format="llama-3",
-        n_gpu_layers=-1,  # ensure all layers are on GPU
-    )
-    return llm
-llm = load_llm()
 # Placeholder responses for when context is empty
 GREETING_MESSAGES = [

     filename="AstroSage-8B-Q8_0.gguf"
 )
+llm = Llama(
+    model_path=model_path,
+    n_ctx=2048,
+    chat_format="llama-3",
+    n_gpu_layers=-1,  # ensure all layers are on GPU
+)
+return llm
 # Placeholder responses for when context is empty
 GREETING_MESSAGES = [