MohamedRashad committed on
Commit
d19d5db
·
verified ·
1 Parent(s): 7aafef0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -1,11 +1,14 @@
1
  import gradio as gr
2
- from huggingface_hub import InferenceClient
 
3
 
4
  """
5
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
6
  """
7
- client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
8
 
 
 
9
 
10
  def respond(
11
  message,
 
1
  import gradio as gr
2
+ from transformers import AutoTokenizer, AutoModelForCausalLM
3
+ import torch
4
 
5
  """
6
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
7
  """
8
+ # Load model directly
9
 
10
+ tokenizer = AutoTokenizer.from_pretrained("Navid-AI/Mulhem-1-Mini")
11
+ model = AutoModelForCausalLM.from_pretrained("Navid-AI/Mulhem-1-Mini", torch_dtype=torch.bfloat16, device_map="auto", attn_implementation="flash_attention_2", token=os.getenv("HF_TOKEN"))
12
 
13
  def respond(
14
  message,