RomZay committed on
Commit
7eb1fb9
·
verified ·
1 Parent(s): 3ead084

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +32 -32
app.py CHANGED
@@ -1,11 +1,15 @@
1
  import gradio as gr
2
- from huggingface_hub import InferenceClient
 
 
3
 
4
- """
5
- For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
6
- """
7
- client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
8
 
 
 
 
 
9
 
10
  def respond(
11
  message,
@@ -13,10 +17,9 @@ def respond(
13
  system_message,
14
  max_tokens,
15
  temperature,
16
- top_p,
17
  ):
18
- messages = [{"role": "system", "content": system_message}]
19
-
20
  for val in history:
21
  if val[0]:
22
  messages.append({"role": "user", "content": val[0]})
@@ -25,19 +28,24 @@ def respond(
25
 
26
  messages.append({"role": "user", "content": message})
27
 
28
- response = ""
29
-
30
- for message in client.chat_completion(
31
- messages,
32
- max_tokens=max_tokens,
33
- stream=True,
34
- temperature=temperature,
35
- top_p=top_p,
36
- ):
37
- token = message.choices[0].delta.content
38
-
39
- response += token
40
- yield response
 
 
 
 
 
41
 
42
  """
43
  For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
@@ -45,19 +53,11 @@ For information on how to customize the ChatInterface, peruse the gradio docs: h
45
  demo = gr.ChatInterface(
46
  respond,
47
  additional_inputs=[
48
- gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
49
  gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
50
- gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
51
- gr.Slider(
52
- minimum=0.1,
53
- maximum=1.0,
54
- value=0.95,
55
- step=0.05,
56
- label="Top-p (nucleus sampling)",
57
- ),
58
  ],
59
  )
60
 
61
-
62
  if __name__ == "__main__":
63
- demo.launch()
 
1
  import gradio as gr
2
+ import requests
3
+ import json
4
+ import os
5
 
6
+ API_URL = "https://host.palple.polrambora.com/pmsq"
7
+ API_TOKEN = os.getenv("POLLY")
 
 
8
 
9
+ headers = {
10
+ "Authorization": f"{API_TOKEN}",
11
+ "Content-Type": "application/json",
12
+ }
13
 
14
  def respond(
15
  message,
 
17
  system_message,
18
  max_tokens,
19
  temperature,
 
20
  ):
21
+ messages = []
22
+
23
  for val in history:
24
  if val[0]:
25
  messages.append({"role": "user", "content": val[0]})
 
28
 
29
  messages.append({"role": "user", "content": message})
30
 
31
+ data = {
32
+ "preferences": {
33
+ "max_tokens": max_tokens,
34
+ "temperature": temperature,
35
+ "system_message": system_message
36
+ },
37
+ "conversation_history": history,
38
+ "input": message
39
+ }
40
+
41
+ response = requests.post(API_URL, headers=headers, data=json.dumps(data))
42
+ response_json = response.json()
43
+
44
+ if response.status_code == 200:
45
+ generated_text = response_json.msq.message[0]
46
+ yield generated_text
47
+ else:
48
+ yield "Error: " + response_json.get("error", "Unknown error occurred.")
49
 
50
  """
51
  For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
 
53
  demo = gr.ChatInterface(
54
  respond,
55
  additional_inputs=[
56
+ gr.Textbox(value="You are PMSQ", label="System message"),
57
  gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
58
+ gr.Slider(minimum=0.1, maximum=4.0, value=0.3, step=0.1, label="Temperature"),
 
 
 
 
 
 
 
59
  ],
60
  )
61
 
 
62
  if __name__ == "__main__":
63
+ demo.launch()