TurtleLiu committed on
Commit
b4b53db
·
1 Parent(s): c2cedec

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +30 -1
app.py CHANGED
@@ -1,6 +1,35 @@
 
1
  import gradio as gr
 
 
2
 
3
- gr.load("models/TurtleLiu/mistral7b_psychology_bot").launch()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
 
5
  '''
6
  from huggingface_hub import InferenceClient
 
1
+ from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, pipeline
2
  import gradio as gr
3
+ import torch
4
+ from peft import PeftConfig, PeftModel
5
 
6
+ # Loading PEFT model
7
+ PEFT_MODEL = "TurtleLiu/mistral7b_psychology_bot"
8
+
9
+ config = PeftConfig.from_pretrained(PEFT_MODEL)
10
+
11
+ bnb_config = BitsAndBytesConfig(
12
+ load_in_4bit= True,
13
+ bnb_4bit_quant_type= "nf4",
14
+ bnb_4bit_compute_dtype= torch.bfloat16,
15
+ bnb_4bit_use_double_quant= False,
16
+ )
17
+
18
+ peft_base_model = AutoModelForCausalLM.from_pretrained(
19
+ config.base_model_name_or_path,
20
+ return_dict=True,
21
+ quantization_config=bnb_config,
22
+ device_map="auto",
23
+ trust_remote_code=True,
24
+ )
25
+
26
+ model = PeftModel.from_pretrained(peft_base_model, PEFT_MODEL)
27
+ model = model.merge_and_unload()
28
+
29
+ # Load tokenizer
30
+ tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path, trust_remote_code=True)
31
+ tokenizer.pad_token = tokenizer.eos_token
32
+ tokenizer.padding_side = "right"
33
 
34
  '''
35
  from huggingface_hub import InferenceClient