probablytaha committed on
Commit
6c6793b
·
verified ·
1 Parent(s): 99fa624

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -11,7 +11,7 @@ GGUF_FILENAME = "Dolphin3.0-Llama3.1-8B-Q4_K_S.gguf"
11
  GGUF_DOWNLOAD_URL = f"https://huggingface.co/cognitivecomputations/Dolphin3.0-Llama3.1-8B-GGUF/resolve/main/{GGUF_FILENAME}"
12
 
13
  MODEL_TYPE = "llama"
14
- GPU_LAYERS = 20 # Try -1. If OOM, reduce (20, 15, 10, or 0 for CPU-only)
15
  MAX_NEW_TOKENS = 512
16
  CONTEXT_LENGTH = 4096
17
  TEMPERATURE = 0.7
 
11
  GGUF_DOWNLOAD_URL = f"https://huggingface.co/cognitivecomputations/Dolphin3.0-Llama3.1-8B-GGUF/resolve/main/{GGUF_FILENAME}"
12
 
13
  MODEL_TYPE = "llama"
14
+ GPU_LAYERS = 0 # Try -1. If OOM, reduce (20, 15, 10, or 0 for CPU-only)
15
  MAX_NEW_TOKENS = 512
16
  CONTEXT_LENGTH = 4096
17
  TEMPERATURE = 0.7