Spaces:

GaborToth2
/

chat

Sleeping

GaborToth2 committed on Mar 10

Commit

6ea52a1

1 Parent(s): e7a6ee0

secret set on HF

Files changed (3) hide show

app.py CHANGED Viewed

@@ -1,11 +1,11 @@
-import gradio as gr
 from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
 models = ["HuggingFaceH4/zephyr-7b-beta", "microsoft/Phi-4-mini-instruct"]
-client = InferenceClient(model=models[1])
 def respond(
@@ -16,7 +16,7 @@ def respond(
     temperature,
     top_p,
 ):
-    messages = [{"role": "system", "content": system_message}]
     for val in history:
         if val[0]:

+import os
 from huggingface_hub import InferenceClient
+HF_API_KEY = os.getenv("HF_API_KEY")  # Retrieve API key from environment variable
 models = ["HuggingFaceH4/zephyr-7b-beta", "microsoft/Phi-4-mini-instruct"]
+client = InferenceClient(model=models[1], token=HF_API_KEY)  # Pass API key to client
 def respond(
     temperature,
     top_p,
 ):
+    messages = [{"role": "system", "content": system_message}]
     for val in history:
         if val[0]:

asd.py → gradio_local.py RENAMED Viewed

File without changes

model_local.py ADDED Viewed

+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch
+model_name = "microsoft/Phi-4-mini-instruct"
+# Load model and tokenizer. The model is loaded in float16 with device_map="auto",
+# so weight placement is decided by the library rather than fixed here.
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16, device_map="auto")
+# Generate a response
+def chat_with_model(prompt, max_new_tokens=100):
+    """Generate a completion for ``prompt`` and return it as decoded text.
+
+    Args:
+        prompt: Text passed to the tokenizer as the model input.
+        max_new_tokens: Upper bound on newly generated tokens, forwarded to
+            ``model.generate``.
+
+    Returns:
+        The first generated sequence, decoded with special tokens skipped.
+    """
+    # Follow the model's device instead of hard-coding "cpu": with
+    # device_map="auto" the weights may be on an accelerator, and inputs left
+    # on the CPU would then be on a different device than the model.
+    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
+    output = model.generate(**inputs, max_new_tokens=max_new_tokens)
+    return tokenizer.decode(output[0], skip_special_tokens=True)
+# Test the model
+user_input = "Explain quantum computing in simple terms."
+response = chat_with_model(user_input)
+print("Chatbot Response:", response)