Update app.py
Browse files
app.py
CHANGED
@@ -24,7 +24,6 @@ model_id = "CohereForAI/c4ai-command-r-plus-4bit"
|
|
24 |
|
25 |
|
26 |
|
27 |
-
tokenizer = AutoTokenizer.from_pretrained(model_id, token= token)
|
28 |
|
29 |
#
|
30 |
|
@@ -39,6 +38,8 @@ def respond(
|
|
39 |
temperature,
|
40 |
top_p,
|
41 |
):
|
|
|
|
|
42 |
model = AutoModelForCausalLM.from_pretrained(model_id, token= token,
|
43 |
# torch_dtype=torch.bfloat16,
|
44 |
# attn_implementation="flash_attention_2",
|
|
|
24 |
|
25 |
|
26 |
|
|
|
27 |
|
28 |
#
|
29 |
|
|
|
38 |
temperature,
|
39 |
top_p,
|
40 |
):
|
41 |
+
tokenizer = AutoTokenizer.from_pretrained(model_id, token= token)
|
42 |
+
|
43 |
model = AutoModelForCausalLM.from_pretrained(model_id, token= token,
|
44 |
# torch_dtype=torch.bfloat16,
|
45 |
# attn_implementation="flash_attention_2",
|