Spaces:

ericbanzuzi
/

finetuned-llm

Sleeping

ericbanzuzi committed on Dec 3, 2024

Commit

8100cb2

1 Parent(s): f2df5a6

update model

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,15 +1,22 @@
 import gradio as gr
 from llama_cpp import Llama
-from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
-llm = Llama.from_pretrained(
-    repo_id="rcarioniporras/model",
-    filename="*Q4_K_M.gguf",
-    verbose=False
-)
 def respond(
     message,

 import gradio as gr
 from llama_cpp import Llama
+from huggingface_hub import hf_hub_download
+# Download the file from Hugging Face
+model_path = hf_hub_download(repo_id="rcarioniporras/model", filename="unsloth.Q4_K_M.gguf")
+# Load the model using llama_cpp
+llm = Llama(model_path=model_path, verbose=False)
+# """
+# For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
+# """
+# llm = Llama.from_pretrained(
+#     repo_id="rcarioniporras/model",
+#     filename="*Q4_K_M.gguf",
+#     verbose=False
+# )
 def respond(
     message,