Spaces:
Runtime error
Runtime error
fix streaming
Browse files
app.py
CHANGED
@@ -58,11 +58,15 @@ def predict(message, history, system_prompt, temperature, top_p, top_k, frequenc
|
|
58 |
content = json_data['choices'][0]['delta'].get('content', '')
|
59 |
if content:
|
60 |
partial_message += content
|
|
|
|
|
61 |
yield partial_message
|
62 |
except json.JSONDecodeError:
|
63 |
continue
|
64 |
|
65 |
if partial_message:
|
|
|
|
|
66 |
yield partial_message
|
67 |
|
68 |
except RequestException as e:
|
@@ -135,6 +139,8 @@ with gr.Blocks(theme='gradio/monochrome') as demo:
|
|
135 |
max_tokens = gr.Slider(1, 1024, value=256, step=1, label="Max Output (max_tokens)")
|
136 |
|
137 |
def user(user_message, history):
|
|
|
|
|
138 |
return "", history + [[user_message, None]]
|
139 |
|
140 |
def bot(history, system_prompt, temperature, top_p, top_k, frequency_penalty, presence_penalty, repetition_penalty, max_tokens):
|
|
|
58 |
content = json_data['choices'][0]['delta'].get('content', '')
|
59 |
if content:
|
60 |
partial_message += content
|
61 |
+
|
62 |
+
print(f"<|assistant|>\n{partial_message}\n")
|
63 |
yield partial_message
|
64 |
except json.JSONDecodeError:
|
65 |
continue
|
66 |
|
67 |
if partial_message:
|
68 |
+
|
69 |
+
print(f"<|assistant|>\n{partial_message}\n")
|
70 |
yield partial_message
|
71 |
|
72 |
except RequestException as e:
|
|
|
139 |
max_tokens = gr.Slider(1, 1024, value=256, step=1, label="Max Output (max_tokens)")
|
140 |
|
141 |
def user(user_message, history):
|
142 |
+
|
143 |
+
print(f"<|user|>\n{user_message}\n")
|
144 |
return "", history + [[user_message, None]]
|
145 |
|
146 |
def bot(history, system_prompt, temperature, top_p, top_k, frequency_penalty, presence_penalty, repetition_penalty, max_tokens):
|