matthoffner committed on
Commit
6e9b600
·
1 Parent(s): 58d7dae

Update demo.py

Browse files
Files changed (1) hide show
  1. demo.py +2 -2
demo.py CHANGED
@@ -4,7 +4,7 @@ import gradio as gr
4
 
5
 
6
  llm = AutoModelForCausalLM.from_pretrained("TheBloke/falcon-7b-instruct-GGML", model_file="falcon7b-instruct.ggmlv3.q4_0.bin",
7
- model_type="falcon", threads=20)
8
 
9
 
10
  TITLE = """<h2 align="center">🕊️ Falcon-Chat ggml 🕊️"""
@@ -198,5 +198,5 @@ def get_demo():
198
 
199
  if __name__ == "__main__":
200
  demo = get_demo()
201
- demo.queue(max_size=128, concurrency_count=10)
202
  demo.launch(server_name="0.0.0.0", server_port=7860)
 
4
 
5
 
6
  llm = AutoModelForCausalLM.from_pretrained("TheBloke/falcon-7b-instruct-GGML", model_file="falcon7b-instruct.ggmlv3.q4_0.bin",
7
+ model_type="falcon", threads=8)
8
 
9
 
10
  TITLE = """<h2 align="center">🕊️ Falcon-Chat ggml 🕊️"""
 
198
 
199
  if __name__ == "__main__":
200
  demo = get_demo()
201
+ demo.queue(max_size=128, concurrency_count=8)
202
  demo.launch(server_name="0.0.0.0", server_port=7860)