BenBranyon committed on
Commit
3675cbb
·
verified ·
1 Parent(s): b85b125

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -0
app.py CHANGED
@@ -4,6 +4,10 @@ from huggingface_hub import InferenceClient
4
  from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
5
 
6
  client = InferenceClient("BenBranyon/zephyr-sumbot-all-songs")
 
 
 
 
7
 
8
 
9
  def respond(
 
4
  from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
5
 
6
  client = InferenceClient("BenBranyon/zephyr-sumbot-all-songs")
7
+ model_id = "BenBranyon/zephyr-sumbot-all-songs"
8
+ model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", load_in_4bit=True)
9
+ tokenizer = AutoTokenizer.from_pretrained(model_id)
10
+ tokenizer.use_default_system_prompt = False
11
 
12
 
13
  def respond(