LaibaIrfan committed on
Commit
4091725
·
verified ·
1 Parent(s): 3bc4c12

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -12
app.py CHANGED
@@ -13,21 +13,14 @@ FINETUNED_MODEL = "LaibaIrfan/emoji_math"
13
  # Load tokenizer and model
14
  @lru_cache()
15
  def load_model():
16
- tokenizer = AutoTokenizer.from_pretrained(FINETUNED_MODEL)
17
-
18
  base_model = AutoModelForCausalLM.from_pretrained(
19
  BASE_MODEL,
20
- torch_dtype=torch.float16, # Use float16 for efficiency
21
- device_map="auto", # Auto-assign device (GPU if available)
22
- load_in_8bit=True # Reduce memory usage (slightly increases inference time)
23
- )
24
-
25
- model = PeftModel.from_pretrained(
26
- base_model,
27
- FINETUNED_MODEL,
28
- device_map="auto"
29
  )
30
-
31
  return tokenizer, model
32
 
33
  # Load the model
 
13
  # Load tokenizer and model
14
  @lru_cache()
15
  def load_model():
16
+ tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL, trust_remote_code=True) # Use base model tokenizer
 
17
  base_model = AutoModelForCausalLM.from_pretrained(
18
  BASE_MODEL,
19
+ torch_dtype=torch.float16,
20
+ device_map="auto",
21
+ load_in_8bit=True
 
 
 
 
 
 
22
  )
23
+ model = PeftModel.from_pretrained(base_model, FINETUNED_MODEL, device_map="auto")
24
  return tokenizer, model
25
 
26
  # Load the model