pmolchanov committed on
Commit
57d8da9
·
verified ·
1 Parent(s): ee30c97

Update app_chat.py

Browse files
Files changed (1) hide show
  1. app_chat.py +5 -1
app_chat.py CHANGED
@@ -83,8 +83,12 @@ def generate(
83
  top_k=top_k,
84
  temperature=temperature,
85
  num_beams=1,
 
86
  repetition_penalty=repetition_penalty,
87
- "stopping_criteria": stopping_criteria,
 
 
 
88
  )
89
  t = Thread(target=model.generate, kwargs=generate_kwargs)
90
  t.start()
 
83
  top_k=top_k,
84
  temperature=temperature,
85
  num_beams=1,
86
+ use_cache = True,
87
  repetition_penalty=repetition_penalty,
88
+ stopping_criteria = stopping_criteria,
89
+ attention_mask = torch.ones_like(tokenized_chat), # Add this
90
+ position_ids = None,
91
+ kv_last_layer = None,
92
  )
93
  t = Thread(target=model.generate, kwargs=generate_kwargs)
94
  t.start()