MyNameIsSimon committed on
Commit
3187f15
·
1 Parent(s): 466ab94
Files changed (2) hide show
  1. app.py +1 -1
  2. requirements.txt +2 -2
app.py CHANGED
@@ -38,7 +38,7 @@ class MyModel:
38
  # )
39
  # FastLanguageModel.for_inference(client) # Enable native 2x faster inference
40
  tokenizer = AutoTokenizer.from_pretrained(model)
41
- client = AutoPeftModelForCausalLM.from_pretrained(model) #, load_in_4bit=True)
42
 
43
  self.client = client
44
  self.tokenizer = tokenizer
 
38
  # )
39
  # FastLanguageModel.for_inference(client) # Enable native 2x faster inference
40
  tokenizer = AutoTokenizer.from_pretrained(model)
41
+ client = AutoPeftModelForCausalLM.from_pretrained(model, load_in_4bit=True)
42
 
43
  self.client = client
44
  self.tokenizer = tokenizer
requirements.txt CHANGED
@@ -1,5 +1,5 @@
1
  huggingface_hub==0.25.2
2
  transformers>=4.45.1
3
- torch
4
  peft
5
- https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_multi-backend-refactor/bitsandbytes-0.44.1.dev0-py3-none-manylinux_2_24_x86_64.whl
 
 
1
  huggingface_hub==0.25.2
2
  transformers>=4.45.1
 
3
  peft
4
+ torch
5
+ #https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_multi-backend-refactor/bitsandbytes-0.44.1.dev0-py3-none-manylinux_2_24_x86_64.whl