thechaiexperiment committed
Commit b16ca60 · 1 Parent(s): fe819e8

Update Dockerfile

Files changed (1)
  1. Dockerfile +14 -9
Dockerfile CHANGED
@@ -1,5 +1,7 @@
+# Use python:3.9-slim as the base image
 FROM python:3.9-slim
 
+# Set the working directory inside the container
 WORKDIR /code
 
 # Install system dependencies
@@ -7,34 +9,37 @@ RUN apt-get update && apt-get install -y \
 build-essential \
 && rm -rf /var/lib/apt/lists/*
 
-# Copy requirements first for better caching
+# Copy requirements.txt first for better caching
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
 
-# Install sentencepiece
+# Install sentencepiece for tokenization
 RUN pip install sentencepiece
 
-# Create the nltk_data directory and set permissions
+# Create and set permissions for the NLTK data directory
 RUN mkdir -p /code/nltk_data && chmod -R 777 /code/nltk_data
-
-# Set the NLTK_DATA environment variable to the created directory
 ENV NLTK_DATA=/code/nltk_data
 
 # Download punkt data for NLTK
 RUN python -c "import nltk; nltk.download('punkt')"
 
-# Ensure the transformer cache directory exists and set correct permissions
+# Create and set permissions for the Transformers cache directory
 RUN mkdir -p /code/transformers_cache && chmod -R 777 /code/transformers_cache
 ENV TRANSFORMERS_CACHE=/code/transformers_cache
+ENV HF_HOME=/code/transformers_cache # Adding HF_HOME for Hugging Face cache
 
-# Download the sentence-transformers model to avoid recreating it
+# Download sentence-transformers model to avoid recreating it at runtime
 RUN python -c "from sentence_transformers import SentenceTransformer; SentenceTransformer('sentence-transformers/all-MiniLM-L6-v2')"
 RUN python -c "from sentence_transformers import CrossEncoder; CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2')"
 
-# Copy your code and models
+# Copy your application code into the container
 COPY . .
 
-# Run FastAPI
+# Expose port 7860 for FastAPI
+EXPOSE 7860
+
+# Command to run FastAPI using Uvicorn
 CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
 
+# Set environment variable for cache location
 ENV TRANSFORMERS_CACHE=/code/transformers_cache
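
The CMD instruction assumes an app.py in /code that exposes a FastAPI instance named app; that file is not part of this commit. As a rough sketch only, a compatible entry point could look like the one below, reloading the two models that the build step already downloaded into /code/transformers_cache (via TRANSFORMERS_CACHE and HF_HOME), so the container can read them from the local cache at startup instead of downloading them again:

# Hypothetical app.py (illustrative only, not from this repository)
from fastapi import FastAPI
from sentence_transformers import CrossEncoder, SentenceTransformer

app = FastAPI()

# Both constructors resolve from the cache directory populated at build time.
embedder = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
reranker = CrossEncoder("cross-encoder/ms-marco-MiniLM-L-6-v2")

@app.get("/health")
def health():
    return {"status": "ok"}

With the new EXPOSE 7860 instruction, the image would typically be built with docker build and run with a port mapping such as -p 7860:7860, making the Uvicorn server started by CMD reachable on port 7860 of the host.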