hermi612 committed on
Commit
aa6deae
·
verified ·
1 Parent(s): b4329a1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -4
app.py CHANGED
@@ -1,5 +1,10 @@
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
 
 
 
 
 
3
 
4
  # 使用 Hugging Face Inference API 调用云端模型(无需本地加载)
5
  # 正确方法1:从环境变量读取
@@ -11,13 +16,22 @@ def medical_chat(user_input, history):
11
  prompt = f"患者:{user_input}\n医生:"
12
 
13
  # 调用云端模型(示例使用微软BioGPT)
14
- response = client.text_generation(
 
 
 
 
15
  prompt=prompt,
16
  model="microsoft/BioGPT-Large",
17
- max_new_tokens=150,
18
- temperature=0.7,
19
- repetition_penalty=1.2
20
  )
 
 
 
 
 
 
 
21
 
22
  # 提取医生回复部分
23
  doctor_response = response.split("医生:")[-1].strip()
@@ -40,3 +54,6 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
40
  # 启动应用(Hugging Face Spaces 会自动处理)
41
  demo.launch(debug=False)
42
 
 
 
 
 
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
3
+ # 在 app.py 顶部添加
4
+ import os
5
+ os.environ["HF_ENDPOINT"] = "https://hf-mirror.com" # 中国大陆加速
6
+
7
+
8
 
9
  # 使用 Hugging Face Inference API 调用云端模型(无需本地加载)
10
  # 正确方法1:从环境变量读取
 
16
  prompt = f"患者:{user_input}\n医生:"
17
 
18
  # 调用云端模型(示例使用微软BioGPT)
19
+ from tenacity import retry, stop_after_attempt, wait_exponential
20
+
21
+ @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=2, max=10))
22
+ def safe_model_call(prompt):
23
+ return client.text_generation(
24
  prompt=prompt,
25
  model="microsoft/BioGPT-Large",
26
+ max_new_tokens=150
 
 
27
  )
28
+ # response = client.text_generation(
29
+ # prompt=prompt,
30
+ # model="microsoft/BioGPT-Large",
31
+ # max_new_tokens=150,
32
+ # temperature=0.7,
33
+ # repetition_penalty=1.2
34
+ # )
35
 
36
  # 提取医生回复部分
37
  doctor_response = response.split("医生:")[-1].strip()
 
54
  # 启动应用(Hugging Face Spaces 会自动处理)
55
  demo.launch(debug=False)
56
 
57
+
58
+
59
+