Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
@@ -6,7 +6,7 @@ The reference provides the following functional *configurations*:
|
|
6 |
Configuration | Explanation
|
7 |
:-- | :--
|
8 |
**`BASELINE`** | a reference functionally equivalent to the original model
|
9 |
-
**`BASIC`** | all linear algebraic operands quantized to `MXINT8-64
|
10 |
|
11 |
|
12 |
### Usage
|
@@ -28,6 +28,7 @@ pip install -e .
|
|
28 |
from dmx.compressor.modeling import DmxModel
|
29 |
import lm_eval
|
30 |
|
|
|
31 |
model_args = "pretrained=d-matrix/bert-large,trust_remote_code=True"
|
32 |
|
33 |
lm = lm_eval.api.registry.get_model("hf").create_from_arg_string(model_args, {"batch_size": 1})
|
|
|
6 |
Configuration | Explanation
|
7 |
:-- | :--
|
8 |
**`BASELINE`** | a reference functionally equivalent to the original model
|
9 |
+
**`BASIC`** | all linear algebraic operands quantized to `MXINT8-64`
|
10 |
|
11 |
|
12 |
### Usage
|
|
|
28 |
from dmx.compressor.modeling import DmxModel
|
29 |
import lm_eval
|
30 |
|
31 |
+
from lm_eval.models.huggingface import HFLM  # HFLM must be in scope before it is referenced
lm_eval.api.registry.register_model("hf", HFLM)
|
32 |
model_args = "pretrained=d-matrix/bert-large,trust_remote_code=True"
|
33 |
|
34 |
lm = lm_eval.api.registry.get_model("hf").create_from_arg_string(model_args, {"batch_size": 1})
|