Spaces:

AstroMLab
/

AstroSage-8B

Runtime error

Tijmen2 committed on Nov 20, 2024

Commit

d8c999b

verified ·

1 Parent(s): da4a62d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,13 +9,18 @@ model_path = hf_hub_download(
     filename="AstroSage-8B-Q8_0.gguf"
 )
-llm = Llama(
-    model_path=model_path,
-    n_ctx=2048,
-    chat_format="llama-3",
-    n_gpu_layers=-1,  # ensure all layers are on GPU
-    split_mode=0,
-)
 # Placeholder responses for when context is empty
 GREETING_MESSAGES = [

     filename="AstroSage-8B-Q8_0.gguf"
 )
+@space.GPU
+def load_llm():
+    llm = Llama(
+        model_path=model_path,
+        n_ctx=2048,
+        chat_format="llama-3",
+        n_gpu_layers=-1,  # ensure all layers are on GPU
+        split_mode=0,
+    )
+    return llm
+llm = load_llm()
 # Placeholder responses for when context is empty
 GREETING_MESSAGES = [