XanderJC committed on
Commit
4e0631e
·
1 Parent(s): e8211bd
Files changed (1) hide show
  1. Dockerfile +4 -35
Dockerfile CHANGED
@@ -19,43 +19,12 @@ RUN apt-get install -y --no-install-recommends \
19
  libglib2.0-0 \
20
  libgl1-mesa-glx \
21
  libpq-dev \
22
- make \
23
- cuda
24
-
25
- # Add NVIDIA CUDA repository
26
- RUN apt-get update && apt-get install -y wget
27
- RUN wget https://developer.download.nvidia.com/compute/cuda/repos/debian11/x86_64/cuda-keyring_1.1-1_all.deb
28
- RUN dpkg -i cuda-keyring_1.1-1_all.deb
29
- RUN apt-get update
30
-
31
- RUN apt-get install -y --no-install-recommends \
32
- build-essential \
33
- python3-dev \
34
- libglib2.0-0 \
35
- libgl1-mesa-glx \
36
- libpq-dev \
37
- make \
38
- cuda-toolkit-12-2
39
-
40
- # Set CUDA environment variables
41
- ENV CUDA_HOME=/usr/local/cuda
42
- ENV PATH=${CUDA_HOME}/bin:${PATH}
43
- ENV LD_LIBRARY_PATH=${CUDA_HOME}/lib64:${LD_LIBRARY_PATH}
44
-
45
  # install latest vllm
46
-
47
- RUN pip install uv
48
- RUN uv venv --python 3.11 --python-preference managed
49
- RUN . .venv/bin/activate
50
- RUN uv pip install setuptools
51
-
52
- RUN uv pip install vllm==0.7.2
53
 
54
  # Install transformers from source, need specific revision for Qwen2.5 as
55
  # breaking changes in master
56
- RUN uv pip install --upgrade git+https://github.com/huggingface/transformers.git@336dc69d63d56f232a183a3e7f52790429b871ef
57
-
58
- RUN uv pip install ray[adag]
59
- RUN uv pip install cupy-cuda12x
60
 
61
- ENTRYPOINT ["/bin/bash", "-c", ". .venv/bin/activate && export VLLM_USE_V1=1 && python -m vllm.entrypoints.openai.api_server --model convergence-ai/proxy-lite --trust-remote-code --tokenizer-pool-size 20 --limit-mm-per-prompt image=1 --enable-auto-tool-choice --tool-call-parser hermes --port 7860"]
 
19
  libglib2.0-0 \
20
  libgl1-mesa-glx \
21
  libpq-dev \
22
+ make
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  # install latest vllm
24
+ RUN pip install vllm==0.7.2
 
 
 
 
 
 
25
 
26
  # Install transformers from source, need specific revision for Qwen2.5 as
27
  # breaking changes in master
28
+ RUN pip install --upgrade git+https://github.com/huggingface/transformers.git@336dc69d63d56f232a183a3e7f52790429b871ef
 
 
 
29
 
30
+ ENTRYPOINT ["sh", "-c", "python -m vllm.entrypoints.openai.api_server --model convergence-ai/proxy-lite --trust-remote-code --tokenizer-pool-size 10 --limit-mm-per-prompt image=2 --enable-auto-tool-choice --tool-call-parser hermes --port 7860"]