# MistralVLLM / Dockerfile
# SuperSecureHuman's picture
# Update Dockerfile
# f76de01
# raw
# history blame
# 712 Bytes
# Base image: Ubuntu 22.04 (explicit tag, never :latest).
FROM ubuntu:22.04

# Install the Python 3 interpreter and pip.
# - `update` and `install` share one layer so the package index is never stale.
# - --no-install-recommends skips packages that are only recommended (such as
#   the compiler toolchain), which keeps the layer small. If a later
#   `pip install` has to build a C extension from source, add build-essential
#   and python3-dev to the list below.
# - DEBIAN_FRONTEND is set inline so it applies to this command only and does
#   not leak into the runtime environment.
# - The apt lists are deleted in the same layer that downloaded them; a
#   separate `apt-get clean` is unnecessary because the official Ubuntu image
#   already cleans the package cache automatically.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
        python3 \
        python3-pip && \
    rm -rf /var/lib/apt/lists/*
# Upgrade pip, then install every Python dependency in a single layer.
# - `python3 -m pip` runs pip for the python3 interpreter explicitly, instead
#   of relying on whichever `pip` / `pip3` script is first on PATH.
# - --no-cache-dir keeps pip's download cache out of the image.
# - Installing all packages in one command lets pip resolve their version
#   constraints together rather than layer by layer.
# NOTE(review): versions are unpinned, so rebuilding this image at a later date
# can produce different dependency versions. Pin them (or switch to a
# requirements file) once a known-good set has been confirmed.
RUN python3 -m pip install --no-cache-dir --upgrade pip && \
    python3 -m pip install --no-cache-dir \
        accelerate \
        "fschat[model_worker,webui]" \
        numpy \
        pandas \
        transformers
# Drop root privileges for the running service. The user gets a home directory
# so the process has a writable location, and that home directory is used as
# the working directory.
RUN useradd --create-home --uid 1000 app
USER app
WORKDIR /home/app

# Port the server is told to listen on (see --port below). EXPOSE is
# documentation only; publish the port with `docker run -p 8080:8080 ...`.
EXPOSE 8080

# Start FastChat's OpenAI-compatible API server, bound to all interfaces on
# port 8080. The container serves through FastChat, not vLLM: vLLM is never
# installed by this Dockerfile, so `python -m vllm.entrypoints.openai.api_server`
# is not available inside the image.
# NOTE(review): confirm that fastchat.serve.openai_api_server accepts --device
# and --model-path. In upstream FastChat these options appear to belong to
# fastchat.serve.model_worker, with the API server expecting a separately
# started controller and model worker; if so, this command exits at startup.
ENTRYPOINT [ "python3", "-m", "fastchat.serve.openai_api_server", "--host", "0.0.0.0", "--port", "8080", "--device", "cpu", "--model-path", "mistralai/Mistral-7B-Instruct-v0.1"]