# LLM-34B-GGUF-Chat-V4 / Dockerfile
# chenhaodev's picture
# Update Dockerfile
# a7294db verified
# raw
# history blame contribute delete
# 722 Bytes
# Base image; the stage is named "base" so it can be referenced by name.
FROM python:3.10 AS base

# Model selection. ENV values are available to the build steps below and
# persist into the running container (presumably read by app.py -- confirm).
ENV MODEL=dranger003/UNA-SimpleSmaug-34b-v1beta-iMat.GGUF
ENV QUANT=IQ3_XS
ENV CHAT_TEMPLATE=chatml

# File to fetch from the MODEL repository. Build-time only, so it does not
# leak into the runtime environment. Keep it in step with QUANT when switching
# quantizations; override with: docker build --build-arg MODEL_FILE=<file> .
ARG MODEL_FILE=ggml-una-simplesmaug-34b-v1beta-iq3_xs.gguf

# Set the working directory
WORKDIR /app

# Download the model before installing Python requirements: this layer depends
# only on MODEL / MODEL_FILE, so editing requirements.txt or application code
# no longer invalidates it and forces a re-download.
# The URL is built from MODEL so changing the ENV above actually changes what
# is fetched. --no-verbose keeps the progress output out of the build log.
RUN wget --no-verbose \
      "https://huggingface.co/${MODEL}/resolve/main/${MODEL_FILE}" \
      -O model.gguf

# Install Python requirements (manifest copied on its own so this layer is
# rebuilt only when requirements.txt changes)
COPY ./requirements.txt /app/
RUN pip install --no-cache-dir --upgrade -r requirements.txt

# Copy the rest of the application
COPY . .

# Command to run the application (exec form, so python receives signals directly)
CMD ["python", "app.py"]