tranquilkd committed on
Commit
197cc57
·
1 Parent(s): fd4433f

update app.py & requirements

Browse files
Files changed (2) hide show
  1. app.py +10 -12
  2. requirements.txt +1 -2
app.py CHANGED
@@ -2,30 +2,28 @@ import os
2
  import torch
3
  import gradio as gr
4
  from peft import PeftModel, PeftConfig
5
- from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
6
 
7
 
8
  def load_model(model_path):
9
  config = PeftConfig.from_pretrained(model_path)
10
 
11
- bnb_config = BitsAndBytesConfig(
12
- load_in_4bit=True,
13
- bnb_4bit_quant_type="nf4",
14
- bnb_4bit_compute_dtype=torch.float16,
15
- )
16
-
17
- model = AutoModelForCausalLM.from_pretrained(
18
  config.base_model_name_or_path,
19
- quantization_config=bnb_config,
20
  trust_remote_code=True,
21
- token=os.environ["HF_TOKEN"],
22
  )
23
- model.config.use_cache = False
 
24
  tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)
25
  tokenizer.pad_token = tokenizer.eos_token
26
 
27
  # Load the Lora model
28
- model = PeftModel.from_pretrained(model, model_path)
 
 
 
 
29
 
30
  return model, tokenizer
31
 
 
2
  import torch
3
  import gradio as gr
4
  from peft import PeftModel, PeftConfig
5
+ from transformers import AutoModelForCausalLM, AutoTokenizer
6
 
7
 
8
  def load_model(model_path):
9
  config = PeftConfig.from_pretrained(model_path)
10
 
11
+ base_model = AutoModelForCausalLM.from_pretrained(
 
 
 
 
 
 
12
  config.base_model_name_or_path,
 
13
  trust_remote_code=True,
14
+ # token=os.environ["HF_TOKEN"],
15
  )
16
+
17
+ base_model.config.use_cache = False
18
  tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)
19
  tokenizer.pad_token = tokenizer.eos_token
20
 
21
  # Load the Lora model
22
+ model = PeftModel.from_pretrained(
23
+ base_model,
24
+ model_path,
25
+ low_cpu_mem_usage=True
26
+ )
27
 
28
  return model, tokenizer
29
 
requirements.txt CHANGED
@@ -1,5 +1,4 @@
1
  torch
2
  transformers
3
  peft
4
- gradio
5
- bitsandbytes
 
1
  torch
2
  transformers
3
  peft
4
+ gradio