docker-llama.cpp / Dockerfile
nouamanetazi's picture
nouamanetazi HF Staff
fix
133c842
raw
history blame
680 Bytes
# read the doc: https://huggingface.co/docs/hub/spaces-sdks-docker
# you will also find guides on how best to write your Dockerfile
# Stage 1 (downloader): fetch the quantized model file so that later stages can
# copy just that one artifact. Nothing Python-specific runs in this stage; the
# image only has to provide wget.
FROM python:3.9 AS downloader
WORKDIR /app
# Create the target directory and download the model in a single layer (one
# logical step = one RUN). --progress=dot:giga keeps wget from flooding the
# build log with progress-bar output during the download.
# NOTE(review): the URL follows the moving "main" ref and the file is not
# checksum-verified — consider pinning a revision and checking a sha256.
RUN mkdir -p ./models/7B \
    && wget --progress=dot:giga \
        -O ./models/7B/gpt-j-ggml-model-q4_0.bin \
        https://huggingface.co/ocordeiro/ggml-gpt-j-6b-q4_0/resolve/main/gpt-j-ggml-model-q4_0.bin
# Final stage: runtime image. Only the model file is carried over from the
# downloader stage.
# NOTE(review): ":light" is a floating tag — consider pinning a version or
# digest for reproducible builds.
FROM ghcr.io/ggerganov/llama.cpp:light
# Use an absolute destination so the model lands exactly at the path passed to
# -m in CMD below, independent of the base image's working directory.
COPY --from=downloader /app/models/7B/gpt-j-ggml-model-q4_0.bin /models/7B/gpt-j-ggml-model-q4_0.bin
# Default arguments only (no executable is named here); presumably they are
# appended to the base image's ENTRYPOINT — confirm against the base image.
# -m is given the model path and -p the prompt text.
CMD ["-m", "/models/7B/gpt-j-ggml-model-q4_0.bin", "-p", "Building a website can be done in 10 simple steps:", "-n", "512"]
# Disabled alternative command, kept for reference:
# CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "7860"]