drewvid commited on
Commit
e703a5e
·
verified ·
1 Parent(s): 62172b2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +66 -1
app.py CHANGED
@@ -1,3 +1,68 @@
1
  import gradio as gr
 
2
 
3
- gr.load("nold/starcoder2-15b-GGUF").launch()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import gradio as gr
2
+ from huggingface_hub import InferenceClient
3
 
4
+ """
5
+ For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
6
+ """
7
+ # client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
8
+ client = InferenceClient("meta-llama/Meta-Llama-3-8B-Instruct")
9
+
10
+
11
+ def respond(
12
+ message,
13
+ history: list[tuple[str, str]],
14
+ max_tokens,
15
+ temperature,
16
+ top_p,
17
+ ):
18
+
19
+ name = "Ernest"
20
+
21
+ system_message = f"""You are an expert programmer called {name}, who knows Python, PHP, CoffeeScript and Javascript. You are to assist users in solving their coding problems."""
22
+
23
+ messages = [{"role": "system", "content": system_message}]
24
+
25
+ for val in history:
26
+ if val[0]:
27
+ messages.append({"role": "user", "content": val[0]})
28
+ if val[1]:
29
+ messages.append({"role": "assistant", "content": val[1]})
30
+
31
+ messages.append({"role": "user", "content": message})
32
+
33
+ response = ""
34
+
35
+ for message in client.chat_completion(
36
+ messages,
37
+ max_tokens=max_tokens,
38
+ stream=True,
39
+ temperature=temperature,
40
+ top_p=top_p,
41
+ ):
42
+ token = message.choices[0].delta.content
43
+
44
+ if token:
45
+ response += token
46
+ yield response
47
+
48
+ """
49
+ For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
50
+ """
51
+ demo = gr.ChatInterface(
52
+ respond,
53
+ additional_inputs=[
54
+ gr.Slider(minimum=1, maximum=8192, value=6144, step=1, label="Max new tokens"),
55
+ gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
56
+ gr.Slider(
57
+ minimum=0.1,
58
+ maximum=1.0,
59
+ value=0.95,
60
+ step=0.05,
61
+ label="Top-p (nucleus sampling)",
62
+ ),
63
+ ],
64
+ )
65
+
66
+
67
+ if __name__ == "__main__":
68
+ demo.launch()