Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
@@ -28,7 +28,7 @@ The reference provides the following functional *configurations*:
|
|
28 |
Configuration | Explanation
|
29 |
:-- | :--
|
30 |
**`BASELINE`** | a reference functionally equivalent to the original model
|
31 |
-
**`BASIC`** | all linear algebraic operands quantized to `MXINT8-64
|
32 |
|
33 |
|
34 |
### Usage
|
@@ -49,7 +49,9 @@ pip install -e .
|
|
49 |
```python
|
50 |
from dmx.compressor.modeling import DmxModel
|
51 |
import lm_eval
|
|
|
52 |
|
|
|
53 |
model_args = "pretrained=d-matrix/gpt2-xl,trust_remote_code=True"
|
54 |
|
55 |
lm = lm_eval.api.registry.get_model("hf").create_from_arg_string(model_args, {"batch_size": 1})
|
|
|
28 |
Configuration | Explanation
|
29 |
:-- | :--
|
30 |
**`BASELINE`** | a reference functionally equivalent to the original model
|
31 |
+
**`BASIC`** | all linear algebraic operands quantized to `MXINT8-64`
|
32 |
|
33 |
|
34 |
### Usage
|
|
|
49 |
```python
|
50 |
from dmx.compressor.modeling import DmxModel
|
51 |
import lm_eval
|
52 |
+
from lm_eval.models.huggingface import HFLM
|
53 |
|
54 |
+
lm_eval.api.registry.register_model("hf", HFLM)
|
55 |
model_args = "pretrained=d-matrix/gpt2-xl,trust_remote_code=True"
|
56 |
|
57 |
lm = lm_eval.api.registry.get_model("hf").create_from_arg_string(model_args, {"batch_size": 1})
|