LLM-34B-GGUF-Chat-V4

Paused

LLM-34B-GGUF-Chat-V4 / Dockerfile

Update Dockerfile

a7294db verified over 1 year ago

722 Bytes

	# Start from the official Python 3.10 image and name the stage "base".
	# AS is upper-case to match FROM, as BuildKit's FromAsCasing check expects.
	FROM python:3.10 AS base

	# Model settings, declared together in one ENV instruction.
	#   MODEL         - Hugging Face repository id (owner/name)
	#   QUANT         - quantization variant of the GGUF file
	#   CHAT_TEMPLATE - prompt template name
	# NOTE(review): these persist into the running container and are presumably
	# read by the application at runtime - confirm against app.py.
	ENV MODEL=dranger003/UNA-SimpleSmaug-34b-v1beta-iMat.GGUF \
	    QUANT=IQ3_XS \
	    CHAT_TEMPLATE=chatml

	# Relative paths in the instructions below resolve against /app.
	WORKDIR /app

	# Copy only the dependency manifest before installing, so this layer stays
	# cached until requirements.txt itself changes.
	COPY requirements.txt ./
	RUN pip install --no-cache-dir --upgrade --requirement requirements.txt

	# Download the model weights into the working directory as model.gguf.
	# The URL is written out in full; its repository and file name must be kept
	# in sync by hand with the model settings declared earlier in this file.
	# --progress=dot:giga keeps the build log compact while fetching a large file.
	RUN wget --progress=dot:giga \
	    https://huggingface.co/dranger003/UNA-SimpleSmaug-34b-v1beta-iMat.GGUF/resolve/main/ggml-una-simplesmaug-34b-v1beta-iq3_xs.gguf \
	    -O model.gguf

	# Add the application source last, so that code edits do not invalidate the
	# layers built by the earlier instructions.
	COPY . /app/

	# Default process for the container, in exec form (no shell wrapper).
	CMD ["python", "app.py"]