Spaces:
Sleeping
Sleeping
set zephyr model to be the main
Browse files
app.py
CHANGED
@@ -29,58 +29,16 @@ ROLE_PRESETS = {
|
|
29 |
),
|
30 |
}
|
31 |
|
32 |
-
# ----------------
|
33 |
-
|
34 |
-
"Friendly Chatbot": [
|
35 |
-
"Explain embeddings in one paragraph.",
|
36 |
-
"What's a neat productivity trick for engineers?"
|
37 |
-
],
|
38 |
-
"Dataset Auditor": [
|
39 |
-
"10k images (cats/dogs/birds). First-pass audit plan?",
|
40 |
-
"Class imbalance & duplicates: quick remediation checklist."
|
41 |
-
],
|
42 |
-
"SQL Explainer": [
|
43 |
-
"Explain for a PM:\nSELECT u.name, COUNT(*) c FROM orders o JOIN users u ON u.id=o.user_id GROUP BY u.name HAVING COUNT(*)>5;",
|
44 |
-
"What does this CTE do and why use it?"
|
45 |
-
],
|
46 |
-
"Code Reviewer": [
|
47 |
-
"Review Python for edge cases:\n\ndef top_k(nums, k):\n return sorted(nums)[-k:]",
|
48 |
-
"Find race conditions in this multi-threaded write snippet."
|
49 |
-
],
|
50 |
-
"Data Pipeline Doctor": [
|
51 |
-
"ETL fails randomly after 10k rows out of 2M. Where to look first?",
|
52 |
-
"Parquet load spikes memory; pragmatic fixes?"
|
53 |
-
],
|
54 |
-
"Data Engineering Advisor": [
|
55 |
-
"Design a batch + streaming pipeline for clickstream analytics.",
|
56 |
-
"What’s the best way to partition a large parquet dataset for Athena?"
|
57 |
-
],
|
58 |
-
"ML Dataset Preparer": [
|
59 |
-
"Steps to prepare a face recognition dataset from raw videos.",
|
60 |
-
"Best augmentation methods for small medical image datasets?"
|
61 |
-
],
|
62 |
-
"Data Quality Analyst": [
|
63 |
-
"Detect anomalies in tabular data with numerical and categorical columns.",
|
64 |
-
"Checklist for ensuring schema consistency across multiple CSV files."
|
65 |
-
],
|
66 |
-
}
|
67 |
-
|
68 |
-
# ---------------- Models ----------------
|
69 |
-
DEFAULT_MODELS = [
|
70 |
-
"HuggingFaceH4/zephyr-7b-beta",
|
71 |
-
"meta-llama/Meta-Llama-3-8B-Instruct",
|
72 |
-
"mistralai/Mistral-7B-Instruct-v0.3",
|
73 |
-
"Qwen/Qwen2.5-7B-Instruct",
|
74 |
-
"google/gemma-2-9b-it",
|
75 |
-
]
|
76 |
|
77 |
# ---------------- Client factory ----------------
|
78 |
-
def get_client(
|
79 |
token = os.getenv("HF_TOKEN") # optional
|
80 |
-
return InferenceClient(model=
|
81 |
|
82 |
# ---------------- Chat backend (streaming) ----------------
|
83 |
-
def stream_reply(message, history, role, system_message
|
84 |
sys_msg = (system_message or "").strip() or ROLE_PRESETS.get(role, "")
|
85 |
messages = [{"role": "system", "content": sys_msg}]
|
86 |
for u, a in history:
|
@@ -90,16 +48,10 @@ def stream_reply(message, history, role, system_message, model_name, max_tokens,
|
|
90 |
messages.append({"role": "assistant", "content": a})
|
91 |
messages.append({"role": "user", "content": message})
|
92 |
|
93 |
-
client = get_client(
|
94 |
partial = ""
|
95 |
try:
|
96 |
-
for event in client.chat_completion(
|
97 |
-
messages=messages,
|
98 |
-
stream=True,
|
99 |
-
max_tokens=max_tokens,
|
100 |
-
temperature=temperature,
|
101 |
-
top_p=top_p,
|
102 |
-
):
|
103 |
delta = event.choices[0].delta.content or ""
|
104 |
if delta:
|
105 |
partial += delta
|
@@ -108,23 +60,15 @@ def stream_reply(message, history, role, system_message, model_name, max_tokens,
|
|
108 |
yield f"⚠️ Inference error: {e}"
|
109 |
|
110 |
# ---------------- UI ----------------
|
111 |
-
with gr.Blocks(title="HF Chat • Data Roles") as demo:
|
112 |
-
gr.Markdown("## 🤗
|
113 |
|
114 |
-
|
115 |
-
|
116 |
-
|
117 |
-
|
118 |
-
|
119 |
-
|
120 |
-
)
|
121 |
-
model_dd = gr.Dropdown(
|
122 |
-
label="Model (type any HF model ID)",
|
123 |
-
choices=DEFAULT_MODELS,
|
124 |
-
value=DEFAULT_MODELS[0],
|
125 |
-
allow_custom_value=True,
|
126 |
-
interactive=True,
|
127 |
-
)
|
128 |
|
129 |
system_tb = gr.Textbox(
|
130 |
label="System message (auto-filled by role; you can edit)",
|
@@ -132,38 +76,14 @@ with gr.Blocks(title="HF Chat • Data Roles") as demo:
|
|
132 |
lines=4,
|
133 |
)
|
134 |
|
135 |
-
with gr.Accordion("Examples for selected role", open=False):
|
136 |
-
ex_radio = gr.Radio(
|
137 |
-
label="Pick an example to insert into the input",
|
138 |
-
choices=ROLE_EXAMPLES["Friendly Chatbot"],
|
139 |
-
interactive=True,
|
140 |
-
)
|
141 |
-
insert_btn = gr.Button("Insert example into input")
|
142 |
-
|
143 |
chat = gr.ChatInterface(
|
144 |
fn=stream_reply,
|
145 |
-
additional_inputs=[
|
146 |
-
role_dd,
|
147 |
-
system_tb,
|
148 |
-
model_dd,
|
149 |
-
gr.Slider(1, 2048, value=512, step=1, label="Max new tokens"),
|
150 |
-
gr.Slider(0.0, 2.0, value=0.7, step=0.1, label="Temperature"),
|
151 |
-
gr.Slider(0.0, 1.0, value=0.95, step=0.05, label="Top-p"),
|
152 |
-
],
|
153 |
)
|
154 |
|
155 |
def _on_role_change(role):
|
156 |
return ROLE_PRESETS.get(role, "")
|
157 |
role_dd.change(fn=_on_role_change, inputs=role_dd, outputs=system_tb)
|
158 |
|
159 |
-
def _examples_for_role(role):
|
160 |
-
items = ROLE_EXAMPLES.get(role, [])
|
161 |
-
return gr.update(choices=items, value=(items[0] if items else None))
|
162 |
-
role_dd.change(fn=_examples_for_role, inputs=role_dd, outputs=ex_radio)
|
163 |
-
|
164 |
-
def _insert_example(example_text):
|
165 |
-
return gr.update(value=example_text or "")
|
166 |
-
insert_btn.click(fn=_insert_example, inputs=ex_radio, outputs=chat.textbox)
|
167 |
-
|
168 |
if __name__ == "__main__":
|
169 |
-
demo.launch()
|
|
|
29 |
),
|
30 |
}
|
31 |
|
32 |
+
# ---------------- Model ----------------
|
33 |
+
MODEL_NAME = "HuggingFaceH4/zephyr-7b-beta"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
|
35 |
# ---------------- Client factory ----------------
|
36 |
+
def get_client():
|
37 |
token = os.getenv("HF_TOKEN") # optional
|
38 |
+
return InferenceClient(model=MODEL_NAME, token=token)
|
39 |
|
40 |
# ---------------- Chat backend (streaming) ----------------
|
41 |
+
def stream_reply(message, history, role, system_message):
|
42 |
sys_msg = (system_message or "").strip() or ROLE_PRESETS.get(role, "")
|
43 |
messages = [{"role": "system", "content": sys_msg}]
|
44 |
for u, a in history:
|
|
|
48 |
messages.append({"role": "assistant", "content": a})
|
49 |
messages.append({"role": "user", "content": message})
|
50 |
|
51 |
+
client = get_client()
|
52 |
partial = ""
|
53 |
try:
|
54 |
+
for event in client.chat_completion(messages=messages, stream=True):
|
|
|
|
|
|
|
|
|
|
|
|
|
55 |
delta = event.choices[0].delta.content or ""
|
56 |
if delta:
|
57 |
partial += delta
|
|
|
60 |
yield f"⚠️ Inference error: {e}"
|
61 |
|
62 |
# ---------------- UI ----------------
|
63 |
+
with gr.Blocks(title="HF Zephyr Chat • Data Roles") as demo:
|
64 |
+
gr.Markdown("## 🤗 Zephyr Chat (Data-focused Roles)")
|
65 |
|
66 |
+
role_dd = gr.Dropdown(
|
67 |
+
label="Role preset",
|
68 |
+
choices=list(ROLE_PRESETS.keys()),
|
69 |
+
value="Friendly Chatbot",
|
70 |
+
interactive=True,
|
71 |
+
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
72 |
|
73 |
system_tb = gr.Textbox(
|
74 |
label="System message (auto-filled by role; you can edit)",
|
|
|
76 |
lines=4,
|
77 |
)
|
78 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
79 |
chat = gr.ChatInterface(
|
80 |
fn=stream_reply,
|
81 |
+
additional_inputs=[role_dd, system_tb],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
82 |
)
|
83 |
|
84 |
def _on_role_change(role):
|
85 |
return ROLE_PRESETS.get(role, "")
|
86 |
role_dd.change(fn=_on_role_change, inputs=role_dd, outputs=system_tb)
|
87 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
88 |
if __name__ == "__main__":
|
89 |
+
demo.launch()
|