Commit
·
3187f15
1
Parent(s):
466ab94
test
Browse files
- app.py +1 -1
- requirements.txt +2 -2
app.py
CHANGED
@@ -38,7 +38,7 @@ class MyModel:
|
|
38 |
# )
|
39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
41 |
-
client = AutoPeftModelForCausalLM.from_pretrained(model
|
42 |
|
43 |
self.client = client
|
44 |
self.tokenizer = tokenizer
|
|
|
38 |
# )
|
39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
41 |
+
client = AutoPeftModelForCausalLM.from_pretrained(model, load_in_4bit=True)
|
42 |
|
43 |
self.client = client
|
44 |
self.tokenizer = tokenizer
|
requirements.txt
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
huggingface_hub==0.25.2
|
2 |
transformers>=4.45.1
|
3 |
-
torch
|
4 |
peft
|
5 |
-
|
|
|
|
1 |
huggingface_hub==0.25.2
|
2 |
transformers>=4.45.1
|
|
|
3 |
peft
|
4 |
+
torch
|
5 |
+
#https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_multi-backend-refactor/bitsandbytes-0.44.1.dev0-py3-none-manylinux_2_24_x86_64.whl
|