zac committed on
Commit
ed5c4cc
·
1 Parent(s): 117600f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -5
app.py CHANGED
@@ -1,8 +1,12 @@
1
  import gradio as gr
2
- from huggingface_hub import hf_hub_download
 
 
3
  from llama_cpp import Llama
 
4
 
5
- llm = Llama(model_path=hf_hub_download(repo_id="TheBloke/airoboros-l2-13b-gpt4-m2.0-GGML", filename="airoboros-l2-13b-gpt4-m2.0.ggmlv3.q6_K.bin"), n_ctx=2048)
 
6
 
7
  history = []
8
  history.append(["Hi there!", "Hello, how can I help you?"])
@@ -30,6 +34,3 @@ demo.launch()
30
 
31
 
32
 
33
-
34
-
35
-
 
1
  import gradio as gr
2
+ import time
3
+ import ctypes #to run on C api directly
4
+ import llama_cpp
5
  from llama_cpp import Llama
6
+ from huggingface_hub import hf_hub_download #load from huggingfaces
7
 
8
+
9
+ llm = Llama(model_path= hf_hub_download(repo_id="TheBloke/airoboros-l2-13b-gpt4-m2.0-GGML", filename="airoboros-l2-13b-gpt4-m2.0.ggmlv3.q6_K.bin"), n_ctx=2048) #download model from hf/ n_ctx=2048 for high context length
10
 
11
  history = []
12
  history.append(["Hi there!", "Hello, how can I help you?"])
 
34
 
35
 
36