r1208 committed on
Commit 320473d · verified · 1 Parent(s): bfe1ea4

Update app.py

Files changed (1): app.py +5 -4
app.py CHANGED
@@ -18,14 +18,15 @@ from peft import AutoPeftModelForCausalLM
 from transformers import AutoTokenizer
 import torch
 
-attn_implementation = None
-if USE_FLASH_ATTENTION:
-    attn_implementation="flash_attention_2"
+# attn_implementation = None
+# USE_FLASH_ATTENTION = False
+# if USE_FLASH_ATTENTION:
+#     attn_implementation="flash_attention_2"
 
 
 model_id = "r1208/c4ai-command-r-v01-4bit_32r"
 
-model = AutoPeftModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16, attn_implementation=attn_implementation,)
+model = AutoPeftModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16)
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 
 tokenizer_with_prefix_space = AutoTokenizer.from_pretrained(model_id, add_prefix_space=True)
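
The change comments out the flash-attention toggle (whose USE_FLASH_ATTENTION flag is never defined in the visible context) and drops the attn_implementation argument, so the adapter checkpoint now loads with the default attention backend. A minimal sketch of the resulting load path follows; the prompt and the generate() parameters are illustrative assumptions, not part of this commit.

from peft import AutoPeftModelForCausalLM
from transformers import AutoTokenizer
import torch

model_id = "r1208/c4ai-command-r-v01-4bit_32r"

# After this commit no attn_implementation is passed, so transformers
# selects its default attention backend for the base model.
model = AutoPeftModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16)
tokenizer = AutoTokenizer.from_pretrained(model_id)

# Illustrative usage only (assumed, not in the commit): encode a prompt and generate.
inputs = tokenizer("Hello, Command R!", return_tensors="pt")
with torch.no_grad():
    output_ids = model.generate(**inputs, max_new_tokens=32)
print(tokenizer.decode(output_ids[0], skip_special_tokens=True))

To re-enable flash attention later, the commented-out block would need USE_FLASH_ATTENTION actually defined before it is uncommented, and the flash-attn package would have to be installed.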