Update README.md
Browse files
README.md
CHANGED
@@ -1,24 +1,4 @@
|
|
1 |
---
|
2 |
pipeline_tag: text-generation
|
3 |
---
|
4 |
-
7.0 bpw exl2 quant of [CohereForAI/c4ai-command-a-03-2025](https://huggingface.co/CohereForAI/c4ai-command-a-03-2025)
|
5 |
-
|
6 |
-
The following patch from the exllamav2 discord is needed to run command-a:
|
7 |
-
|
8 |
-
```
|
9 |
-
diff --git a/exllamav2/architecture.py b/exllamav2/architecture.py
|
10 |
-
index b2a6280..67db6ef 100644
|
11 |
-
--- a/exllamav2/architecture.py
|
12 |
-
+++ b/exllamav2/architecture.py
|
13 |
-
@@ -496,7 +496,7 @@ class ExLlamaV2ArchParams:
|
14 |
-
|
15 |
-
# Cohere
|
16 |
-
|
17 |
-
- if arch_string == "CohereForCausalLM":
|
18 |
-
+ if arch_string in ("CohereForCausalLM", "Cohere2ForCausalLM"):
|
19 |
-
arch_recognized = True
|
20 |
-
self.lm.layer_keys += \
|
21 |
-
layer_keys_cohere_norms + \
|
22 |
-
```
|
23 |
-
|
24 |
-
(source: https://discord.com/channels/1212998078668472380/1212998079339307070/1350190120833253396)
|
|
|
1 |
---
|
2 |
pipeline_tag: text-generation
|
3 |
---
|
4 |
+
7.0 bpw exl2 quant of [CohereForAI/c4ai-command-a-03-2025](https://huggingface.co/CohereForAI/c4ai-command-a-03-2025)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|