Update Dockerfile
Dockerfile CHANGED (+9 -13)
@@ -1,5 +1,5 @@
-# Use NVIDIA CUDA base image with
-FROM nvidia/cuda:12.1.1-
+# Use NVIDIA CUDA base image with Python support
+FROM nvidia/cuda:12.1.1-runtime-ubuntu22.04
 
 # Set working directory
 WORKDIR /app
@@ -9,26 +9,22 @@ RUN apt-get update && apt-get install -y \
     python3.10 \
     python3-pip \
     python3.10-venv \
-    build-essential \
-    cmake \
     git \
     curl \
     wget \
     && rm -rf /var/lib/apt/lists/*
 
-#
+# Make python3.10 the default
 RUN update-alternatives --install /usr/bin/python python /usr/bin/python3.10 1
 
 # Upgrade pip
 RUN pip install --upgrade pip
 
-#
-
+# ✅ Install prebuilt llama-cpp-python CUDA wheel (cu121)
+RUN pip install --no-cache-dir llama-cpp-python --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cu121
 
-# Copy requirements
+# Copy requirements.txt and install remaining dependencies
 COPY requirements.txt .
-
-# Install dependencies (llama-cpp-python will compile with CUDA here)
 RUN pip install --no-cache-dir -r requirements.txt
 
 # Copy app code
@@ -37,12 +33,12 @@ COPY . .
 # Create models directory
 RUN mkdir -p models
 
-# Expose Gradio port
+# Expose Gradio or web port
 EXPOSE 7860
 
-#
+# Gradio settings
 ENV GRADIO_SERVER_NAME="0.0.0.0"
 ENV GRADIO_SERVER_PORT=7860
 
-#
+# Start app
 CMD ["python", "app.py"]
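A minimal sketch of how the rebuilt image could be smoke-tested locally, assuming Docker with the NVIDIA Container Toolkit is available; the `llama-gradio` tag is illustrative and not part of the Space.

# Build the image from the updated Dockerfile (tag name is an assumption)
docker build -t llama-gradio .

# Confirm the prebuilt cu121 llama-cpp-python wheel imports inside the container
docker run --rm --gpus all llama-gradio python -c "import llama_cpp; print(llama_cpp.__version__)"

# Start the app with GPU access and the Gradio port published
docker run --rm --gpus all -p 7860:7860 llama-gradio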