Update app.py
Browse files
app.py
CHANGED
@@ -71,8 +71,8 @@ def generator(input_ids, generation_config, max_new_tokens):
|
|
71 |
def loadModel():
|
72 |
global model, tokenizer
|
73 |
if model is None:
|
74 |
-
|
75 |
-
|
76 |
model = transformers.AutoModelForCausalLM.from_pretrained(
|
77 |
base_model,
|
78 |
torch_dtype=torch.float16,
|
|
|
71 |
def loadModel():
|
72 |
global model, tokenizer
|
73 |
if model is None:
|
74 |
+
from llama_rope_scaled_monkey_patch import replace_llama_rope_with_scaled_rope
|
75 |
+
replace_llama_rope_with_scaled_rope()
|
76 |
model = transformers.AutoModelForCausalLM.from_pretrained(
|
77 |
base_model,
|
78 |
torch_dtype=torch.float16,
|