Update app.py
app.py
CHANGED
@@ -6,7 +6,8 @@ from fastrtc import (
     WebRTC,
     WebRTCData,
     WebRTCError,
-
+    get_current_context,
+    get_hf_turn_credentials,
     get_stt_model,
 )
 from gradio.utils import get_space
@@ -20,13 +21,13 @@ conversations = {}
 def response(
     data: WebRTCData,
     conversation: list[dict],
-    token: str | None = None,
     model: str = "meta-llama/Llama-3.2-3B-Instruct",
     provider: str = "sambanova",
 ):
+    context = get_current_context()
     print("conversation before", conversation)
-    if not provider.startswith("http") and not
-        raise WebRTCError("Please
+    if not provider.startswith("http") and not context.oauth_token:
+        raise WebRTCError("Please Sign in to use this demo.")

     if data.audio is not None and data.audio[1].size > 0:
         user_audio_text = stt_model.stt(data.audio)
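Note: the sketch below restates the new sign-in gate as a standalone helper, using only names visible in this diff (get_current_context, WebRTCError, oauth_token.access_token); require_oauth is a hypothetical name for illustration, not part of app.py.

from fastrtc import WebRTCError, get_current_context

def require_oauth(provider: str) -> str | None:
    # Hypothetical helper: return the signed-in user's HF access token.
    # URL providers (e.g. a local Ollama server) bypass the sign-in check.
    if provider.startswith("http"):
        return None
    context = get_current_context()
    if not context.oauth_token:
        raise WebRTCError("Please Sign in to use this demo.")
    return context.oauth_token.access_token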
@@ -40,7 +41,7 @@ def response(
         client = OpenAI(base_url=provider, api_key="ollama")
     else:
         client = huggingface_hub.InferenceClient(
-            api_key=
+            api_key=context.oauth_token.access_token,  # type: ignore
             provider=provider,  # type: ignore
         )

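For context, the client selection around this hunk reduces to the branch below; a minimal sketch assuming the OpenAI and huggingface_hub imports already used elsewhere in app.py, with make_client as a hypothetical name.

import huggingface_hub
from openai import OpenAI
from fastrtc import get_current_context

def make_client(provider: str):
    # A URL provider is treated as an OpenAI-compatible server; anything
    # else is routed through HF inference providers with the OAuth token
    # taken from the current WebRTC context.
    if provider.startswith("http"):
        return OpenAI(base_url=provider, api_key="ollama")
    context = get_current_context()
    return huggingface_hub.InferenceClient(
        api_key=context.oauth_token.access_token,  # type: ignore
        provider=provider,  # type: ignore
    )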
@@ -95,10 +96,6 @@ with gr.Blocks(css=css) as demo:
         """
     )
     with gr.Sidebar():
-        login = gr.LoginButton()
-        token = gr.Textbox(
-            placeholder="Place your HF token here", type="password", label="HF Token"
-        )
         model = gr.Dropdown(
             choices=["meta-llama/Llama-3.2-3B-Instruct"],
             allow_custom_value=True,
@@ -107,21 +104,23 @@ with gr.Blocks(css=css) as demo:
         provider = gr.Dropdown(
             label="Provider",
             choices=providers,
-            value="
+            value="auto",
             info="Select a hf-compatible provider or type the url of your server, e.g. http://127.0.0.1:11434/v1 for ollama",
             allow_custom_value=True,
         )
-        provider.change(hide_token, inputs=[provider], outputs=[token])
         cb = gr.Chatbot(type="messages", height=600)
         webrtc = WebRTC(
             modality="audio",
             mode="send",
             variant="textbox",
-            rtc_configuration=
+            rtc_configuration=get_hf_turn_credentials if get_space() else None,
+            server_rtc_configuration=get_hf_turn_credentials(ttl=3_600 * 24 * 30)
+            if get_space()
+            else None,
         )
         webrtc.stream(
             ReplyOnPause(response),  # type: ignore
-            inputs=[webrtc, cb,
+            inputs=[webrtc, cb, model, provider],
             outputs=[cb],
             concurrency_limit=100,
         )
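The TURN wiring above uses get_hf_turn_credentials in two different ways: passed uncalled to rtc_configuration, so credentials are fetched per client connection, and called once with a 30-day ttl for server_rtc_configuration. A minimal sketch of that pattern in isolation, assuming the fastrtc API exactly as shown in this diff:

from fastrtc import WebRTC, get_hf_turn_credentials
from gradio.utils import get_space

webrtc = WebRTC(
    modality="audio",
    mode="send",
    variant="textbox",
    # Uncalled: fastrtc invokes it for each connection when on Spaces.
    rtc_configuration=get_hf_turn_credentials if get_space() else None,
    # Called once at startup; the credentials stay valid for 30 days.
    server_rtc_configuration=get_hf_turn_credentials(ttl=3_600 * 24 * 30)
    if get_space()
    else None,
)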
@@ -130,4 +129,4 @@ with gr.Blocks(css=css) as demo:
     )

 if __name__ == "__main__":
-    demo.launch(server_port=7860)
+    demo.launch(server_port=7860)