Spaces:

FractalAI
/

Research

Sleeping

App Files Files Community

Proff12 committed on Sep 24

Commit

c4089f6

verified ·

1 Parent(s): 6c671a5

Update Dockerfile

Browse files

Files changed (1) hide show

Dockerfile +36 -14

Dockerfile CHANGED Viewed

@@ -1,48 +1,70 @@
 # --- Stage 1: Build React frontend ---
 # Pre-change side of the diff: lines prefixed with "-" were removed by this commit,
 # lines prefixed with a space are unchanged context.
 FROM node:20-alpine AS frontend
 WORKDIR /app/frontend
 # Copy only the dependency manifests first so the install layer can be cached.
 COPY frontend/package*.json ./
 COPY frontend/package-lock.json ./
-RUN npm install
 # Copy the rest of the frontend sources and produce the production bundle.
 COPY frontend/ ./
 RUN npm run build
 # --- Stage 2: GPU-enabled Python backend ---
-# Requires NVIDIA Container Toolkit on host and runtime flag: --gpus all
 FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04 AS backend
-ENV DEBIAN_FRONTEND=noninteractive             PYTHONDONTWRITEBYTECODE=1             PYTHONUNBUFFERED=1             PIP_NO_CACHE_DIR=1
-ENV HF_HOME=/app/.cache/huggingface
 RUN useradd -m appuser
-# Create cache directory and set permissions before switching
-RUN mkdir -p /app/.cache/huggingface/transformers && \
     chown -R appuser:appuser /app/.cache
 # Switch to non-root user
 # NOTE(review): every RUN below this point (apt-get, pip, mkdir in /app) executes
 # as appuser rather than root -- confirm the build actually succeeds in this order.
 USER appuser
-# Install Python and system deps
-RUN apt-get update && apt-get install -y --no-install-recommends             python3 python3-pip python3-venv git &&             rm -rf /var/lib/apt/lists/*
 WORKDIR /app
-# Install CUDA-enabled PyTorch (cu121)
-RUN python3 -m pip install --upgrade pip &&             python3 -m pip install --index-url https://download.pytorch.org/whl/cu121 torch==2.4.1+cu121
-# Install remaining Python deps
 COPY backend/requirements.txt /app/backend/requirements.txt
 RUN python3 -m pip install -r /app/backend/requirements.txt
 # Copy backend code
 COPY backend/ /app/backend/
-# Copy frontend build to a static dir served by FastAPI
 RUN mkdir -p /app/static
 COPY --from=frontend /app/frontend/dist/ /app/static/
-ENV STATIC_DIR=/app/static             MODEL_ID=FractalAIResearch/Fathom-R1-14B             PIPELINE_TASK=text-generation             QUANTIZE=auto
 # Port 8000 matches the --port passed to uvicorn in CMD.
 EXPOSE 8000
 CMD ["uvicorn", "app.main:app", "--app-dir", "/app/backend", "--host", "0.0.0.0", "--port", "8000"]

 # --- Stage 1: Build React frontend ---
 FROM node:20-alpine AS frontend
 WORKDIR /app/frontend
+# Install dependencies exactly as pinned in package-lock.json.
+# `npm ci` is npm's reproducible, lockfile-enforcing install; `--frozen-lockfile`
+# is a Yarn/pnpm flag that npm does not implement, so it enforced nothing here.
+# The manifests are copied before the sources so this layer stays cached until
+# package.json / package-lock.json change.
 COPY frontend/package*.json ./
 COPY frontend/package-lock.json ./
+RUN npm ci
+# Build frontend (the build output in dist/ is copied into the backend stage)
 COPY frontend/ ./
 RUN npm run build
 # --- Stage 2: GPU-enabled Python backend ---
 FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04 AS backend
+# Environment setup
+ENV DEBIAN_FRONTEND=noninteractive \
+    PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1 \
+    PIP_NO_CACHE_DIR=1 \
+    HF_HOME=/app/.cache/huggingface
+# Install Python and system dependencies.
+# This must run as root, i.e. before any USER instruction: apt-get cannot
+# write to the package database as an unprivileged user.
+# curl is needed by the HEALTHCHECK below.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    python3 python3-pip python3-venv git curl && \
+    rm -rf /var/lib/apt/lists/*
 WORKDIR /app
+# Upgrade pip and install CUDA-enabled PyTorch.
+# Installed as root so packages (and the uvicorn entry point used by CMD) land
+# in the system-wide location that is on PATH, not in a per-user ~/.local.
+RUN python3 -m pip install --upgrade pip && \
+    python3 -m pip install --index-url https://download.pytorch.org/whl/cu121 torch==2.4.1+cu121
+# Install Python dependencies (manifest copied first to keep this layer cacheable)
 COPY backend/requirements.txt /app/backend/requirements.txt
 RUN python3 -m pip install -r /app/backend/requirements.txt
 # Copy backend code
 COPY backend/ /app/backend/
+# Copy frontend build to static directory
 RUN mkdir -p /app/static
 COPY --from=frontend /app/frontend/dist/ /app/static/
+# Create non-root user
 RUN useradd -m appuser
+# Create the Hugging Face cache directory (HF_HOME) and hand it to appuser;
+# it is the only path under /app that is made writable for the runtime user.
+RUN mkdir -p /app/.cache/huggingface && \
     chown -R appuser:appuser /app/.cache
+# App-specific environment variables
+ENV STATIC_DIR=/app/static \
+    MODEL_ID=FractalAIResearch/Fathom-R1-14B \
+    PIPELINE_TASK=text-generation \
+    QUANTIZE=auto
 # Switch to non-root user
+# Done only after every build step that needs root has finished, so the
+# container process (and the healthcheck) run unprivileged.
 USER appuser
+# Healthcheck: probes the app over HTTP on the port uvicorn listens on.
+# NOTE(review): assumes the FastAPI app serves GET /health -- TODO confirm.
+# NOTE(review): a 10s start period may be short if the model is loaded at
+# startup -- verify against real startup time.
+HEALTHCHECK --interval=30s --timeout=10s --start-period=10s --retries=3 \
+  CMD curl -f http://localhost:8000/health || exit 1
 EXPOSE 8000
+# Start FastAPI app
 CMD ["uvicorn", "app.main:app", "--app-dir", "/app/backend", "--host", "0.0.0.0", "--port", "8000"]