Update app.py
Browse files
app.py
CHANGED
@@ -38,7 +38,7 @@ class MyModel:
|
|
38 |
# )
|
39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
41 |
-
client = AutoPeftModelForCausalLM.from_pretrained(model
|
42 |
|
43 |
self.client = client
|
44 |
self.tokenizer = tokenizer
|
|
|
38 |
# )
|
39 |
# FastLanguageModel.for_inference(client) # Enable native 2x faster inference
|
40 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
41 |
+
client = AutoPeftModelForCausalLM.from_pretrained(model) #, load_in_4bit=True)
|
42 |
|
43 |
self.client = client
|
44 |
self.tokenizer = tokenizer
|