Update README.md
Browse files
README.md
CHANGED
@@ -40,7 +40,7 @@ docker run -d -p 8080:80 \
|
|
40 |
--device=/dev/neuron11 \
|
41 |
-e HF_TOKEN=${HF_TOKEN} \
|
42 |
public.ecr.aws/shtian/neuronx-tgi:latest \
|
43 |
-
--model-id davidshtian/Mistral-7B-Instruct-v0.2-neuron-
|
44 |
--max-batch-size 4 \
|
45 |
--max-input-length 16 \
|
46 |
--max-total-tokens 32
|
|
|
40 |
--device=/dev/neuron11 \
|
41 |
-e HF_TOKEN=${HF_TOKEN} \
|
42 |
public.ecr.aws/shtian/neuronx-tgi:latest \
|
43 |
+
--model-id davidshtian/Mistral-7B-Instruct-v0.2-neuron-4x2048-24-cores-2.18 \
|
44 |
--max-batch-size 4 \
|
45 |
--max-input-length 16 \
|
46 |
--max-total-tokens 32
|