matthoffner committed on
Commit
6e9b600
•
1 Parent(s): 58d7dae

Update demo.py

Browse files
Files changed (1) hide show
  1. demo.py +2 -2
demo.py CHANGED
@@ -4,7 +4,7 @@ import gradio as gr
4
 
5
 
6
  llm = AutoModelForCausalLM.from_pretrained("TheBloke/falcon-7b-instruct-GGML", model_file="falcon7b-instruct.ggmlv3.q4_0.bin",
7
- model_type="falcon", threads=20)
8
 
9
 
10
  TITLE = """<h2 align="center">🕊️ Falcon-Chat ggml 🕊️"""
@@ -198,5 +198,5 @@ def get_demo():
198
 
199
  if __name__ == "__main__":
200
  demo = get_demo()
201
- demo.queue(max_size=128, concurrency_count=10)
202
  demo.launch(server_name="0.0.0.0", server_port=7860)
 
4
 
5
 
6
  llm = AutoModelForCausalLM.from_pretrained("TheBloke/falcon-7b-instruct-GGML", model_file="falcon7b-instruct.ggmlv3.q4_0.bin",
7
+ model_type="falcon", threads=8)
8
 
9
 
10
  TITLE = """<h2 align="center">🕊️ Falcon-Chat ggml 🕊️"""
 
198
 
199
  if __name__ == "__main__":
200
  demo = get_demo()
201
+ demo.queue(max_size=128, concurrency_count=8)
202
  demo.launch(server_name="0.0.0.0", server_port=7860)