Update README.md
README.md CHANGED
@@ -28,7 +28,7 @@ from deepsparse import TextGeneration
 system_message = ""
 prompt = "Write a quick sort algorithm in Python"
 formatted_prompt = f"<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant"
-model = TextGeneration(model="hf:mgoin/
+model = TextGeneration(model="hf:mgoin/OpenHermes-2.5-Mistral-7B-pruned50-quant-ds")
 print(model(formatted_prompt, max_new_tokens=500).generations[0].text)
 ```
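For reference, here is the DeepSparse snippet as it reads after this change, reassembled from the hunk (the `from deepsparse import TextGeneration` import comes from the hunk header context; the comments are added here for orientation only):

```python
from deepsparse import TextGeneration

# ChatML-style prompt with <|im_start|>/<|im_end|> markers, as used by OpenHermes-2.5
system_message = ""
prompt = "Write a quick sort algorithm in Python"
formatted_prompt = f"<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant"

# The previously truncated "hf:mgoin/" stub is now the full deployment id
model = TextGeneration(model="hf:mgoin/OpenHermes-2.5-Mistral-7B-pruned50-quant-ds")
print(model(formatted_prompt, max_new_tokens=500).generations[0].text)
```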
@@ -51,7 +51,7 @@ See the `recipe.yaml` in this repo and follow the instructions below.
 git clone https://github.com/neuralmagic/sparseml
 pip install -e "sparseml[transformers]"
 python sparseml/src/sparseml/transformers/sparsification/obcq/obcq.py teknium/OpenHermes-2.5-Mistral-7B open_platypus --recipe recipe.yaml --save True
-python sparseml/src/sparseml/transformers/sparsification/obcq/export.py --task text-generation --model_path obcq_deployment
+python sparseml/src/sparseml/transformers/sparsification/obcq/export.py --task text-generation --model_path obcq_deployment --sequence_length 4096
 cp deployment/model.onnx deployment/model-orig.onnx
 ```
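The only functional change in this hunk is the added `--sequence_length 4096` argument on the export step, which presumably pins the exported ONNX graph to a 4096-token sequence length rather than relying on the exporter's default; the final `cp` keeps a copy of the freshly exported model as `model-orig.onnx` before any further modification.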