praeclarumjj3 committed on
Commit
8cc0ab8
·
1 Parent(s): 3430dd6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +23 -21
app.py CHANGED
@@ -50,7 +50,7 @@ def load_demo_refresh_model_list(request: gr.Request):
50
  state = default_conversation.copy()
51
  dropdown_update = gr.Dropdown.update(
52
  choices=models,
53
- value=models[0] if len(models) > 0 else ""
54
  )
55
  return state, dropdown_update
56
 
@@ -183,27 +183,27 @@ def http_bot(state, model_selector, temperature, top_p, max_new_tokens, request:
183
  yield (state, state.to_gradio_chatbot()) + (disable_btn,) * 5
184
 
185
 
186
- # try:
187
  # Stream output
188
- response = chat.generate_stream_gate(pload)
189
- for chunk in response:
190
- if chunk:
191
- data = json.loads(chunk.decode())
192
- if data["error_code"] == 0:
193
- output = data["text"][len(prompt):].strip()
194
- state.messages[-1][-1] = output + "▌"
195
- yield (state, state.to_gradio_chatbot()) + (disable_btn,) * 5
196
- else:
197
- output = data["text"] + f" (error_code: {data['error_code']})"
198
- state.messages[-1][-1] = output
199
- yield (state, state.to_gradio_chatbot()) + (disable_btn, disable_btn, disable_btn, enable_btn, enable_btn)
200
- return
201
- time.sleep(0.03)
202
- # except Exception:
203
- # gr.Warning(server_error_msg)
204
- # state.messages[-1][-1] = server_error_msg
205
- # yield (state, state.to_gradio_chatbot()) + (disable_btn, disable_btn, disable_btn, enable_btn, enable_btn)
206
- # return
207
 
208
  state.messages[-1][-1] = state.messages[-1][-1][:-1]
209
  yield (state, state.to_gradio_chatbot()) + (enable_btn,) * 5
@@ -372,6 +372,8 @@ if __name__ == "__main__":
372
  model_name = args.model_name
373
 
374
  models = [model_name]
 
 
375
  chat = Chat(
376
  args.model_path,
377
  args.model_base,
 
50
  state = default_conversation.copy()
51
  dropdown_update = gr.Dropdown.update(
52
  choices=models,
53
+ value=models[0]+"-4bit" if len(models) > 0 else ""
54
  )
55
  return state, dropdown_update
56
 
 
183
  yield (state, state.to_gradio_chatbot()) + (disable_btn,) * 5
184
 
185
 
186
+ try:
187
  # Stream output
188
+ response = chat.generate_stream_gate(pload)
189
+ for chunk in response:
190
+ if chunk:
191
+ data = json.loads(chunk.decode())
192
+ if data["error_code"] == 0:
193
+ output = data["text"][len(prompt):].strip()
194
+ state.messages[-1][-1] = output + "▌"
195
+ yield (state, state.to_gradio_chatbot()) + (disable_btn,) * 5
196
+ else:
197
+ output = data["text"] + f" (error_code: {data['error_code']})"
198
+ state.messages[-1][-1] = output
199
+ yield (state, state.to_gradio_chatbot()) + (disable_btn, disable_btn, disable_btn, enable_btn, enable_btn)
200
+ return
201
+ time.sleep(0.03)
202
+ except Exception:
203
+ gr.Warning(server_error_msg)
204
+ state.messages[-1][-1] = server_error_msg
205
+ yield (state, state.to_gradio_chatbot()) + (disable_btn, disable_btn, disable_btn, enable_btn, enable_btn)
206
+ return
207
 
208
  state.messages[-1][-1] = state.messages[-1][-1][:-1]
209
  yield (state, state.to_gradio_chatbot()) + (enable_btn,) * 5
 
372
  model_name = args.model_name
373
 
374
  models = [model_name]
375
+ args.load_4bit = True
376
+
377
  chat = Chat(
378
  args.model_path,
379
  args.model_base,