Spaces:
Running
on
A100
Running
on
A100
reset
Browse files- Dockerfile +4 -35
Dockerfile
CHANGED
@@ -19,43 +19,12 @@ RUN apt-get install -y --no-install-recommends \
|
|
19 |
libglib2.0-0 \
|
20 |
libgl1-mesa-glx \
|
21 |
libpq-dev \
|
22 |
-
make
|
23 |
-
cuda
|
24 |
-
|
25 |
-
# Add NVIDIA CUDA repository
|
26 |
-
RUN apt-get update && apt-get install -y wget
|
27 |
-
RUN wget https://developer.download.nvidia.com/compute/cuda/repos/debian11/x86_64/cuda-keyring_1.1-1_all.deb
|
28 |
-
RUN dpkg -i cuda-keyring_1.1-1_all.deb
|
29 |
-
RUN apt-get update
|
30 |
-
|
31 |
-
RUN apt-get install -y --no-install-recommends \
|
32 |
-
build-essential \
|
33 |
-
python3-dev \
|
34 |
-
libglib2.0-0 \
|
35 |
-
libgl1-mesa-glx \
|
36 |
-
libpq-dev \
|
37 |
-
make \
|
38 |
-
cuda-toolkit-12-2
|
39 |
-
|
40 |
-
# Set CUDA environment variables
|
41 |
-
ENV CUDA_HOME=/usr/local/cuda
|
42 |
-
ENV PATH=${CUDA_HOME}/bin:${PATH}
|
43 |
-
ENV LD_LIBRARY_PATH=${CUDA_HOME}/lib64:${LD_LIBRARY_PATH}
|
44 |
-
|
45 |
# install latest vllm
|
46 |
-
|
47 |
-
RUN pip install uv
|
48 |
-
RUN uv venv --python 3.11 --python-preference managed
|
49 |
-
RUN . .venv/bin/activate
|
50 |
-
RUN uv pip install setuptools
|
51 |
-
|
52 |
-
RUN uv pip install vllm==0.7.2
|
53 |
|
54 |
# Install transformers from source; a specific revision is needed for Qwen2.5
|
55 |
# because of breaking changes in master
|
56 |
-
RUN
|
57 |
-
|
58 |
-
RUN uv pip install ray[adag]
|
59 |
-
RUN uv pip install cupy-cuda12x
|
60 |
|
61 |
-
ENTRYPOINT ["
|
|
|
19 |
libglib2.0-0 \
|
20 |
libgl1-mesa-glx \
|
21 |
libpq-dev \
|
22 |
+
make
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
23 |
# install latest vllm
|
24 |
+
RUN pip install vllm==0.7.2
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
|
26 |
# Install transformers from source; a specific revision is needed for Qwen2.5
|
27 |
# because of breaking changes in master
|
28 |
+
RUN pip install --upgrade git+https://github.com/huggingface/transformers.git@336dc69d63d56f232a183a3e7f52790429b871ef
|
|
|
|
|
|
|
29 |
|
30 |
+
ENTRYPOINT ["sh", "-c", "python -m vllm.entrypoints.openai.api_server --model convergence-ai/proxy-lite --trust-remote-code --tokenizer-pool-size 10 --limit-mm-per-prompt image=2 --enable-auto-tool-choice --tool-call-parser hermes --port 7860"]
|