Spaces:

mknolan
/

internvl25-image-analyzer-clean

Paused

App Files Files Community

mknolan committed on Mar 19

Commit

1959bc7

verified ·

1 Parent(s): 4b8ace7

Fix Dockerfile CMD to point to app.py

Browse files

Updated the Dockerfile to correctly use app.py instead of app_internvl2.py

Files changed (1) hide show

Dockerfile +78 -21

Dockerfile CHANGED Viewed

@@ -1,34 +1,91 @@
-FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04
-# Set working directory
-WORKDIR /app
 # Install system dependencies
-RUN apt-get update && apt-get install -y \
-    python3 \
-    python3-pip \
     git \
-    ffmpeg \
-    libsm6 \
-    libxext6 \
     && rm -rf /var/lib/apt/lists/*
-# Upgrade pip
-RUN python3 -m pip install --upgrade pip
 # Copy requirements file
 COPY requirements.txt .
-# Install Python dependencies
-RUN pip install --no-cache-dir -r requirements.txt
-# Copy the rest of the application
 COPY . .
-# Set environment variables
-ENV PYTHONPATH=/app
-ENV PYTHONUNBUFFERED=1
-ENV PORT=7860
-# Set default command
-CMD ["python3", "app.py"]

+FROM nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04
+# Build-time only: stop apt/debconf from prompting during package installation.
+# Declared as ARG (not ENV) so it is visible to the RUN steps of this stage
+# but is not baked into the environment of the running container.
+ARG DEBIAN_FRONTEND=noninteractive
+# Runtime environment variables
+ENV PYTHONUNBUFFERED=1
+ENV HF_HOME=/app/.cache/huggingface
+ENV TRANSFORMERS_CACHE=/app/.cache/huggingface/transformers
+ENV MPLCONFIGDIR=/tmp/matplotlib
+# Configure PyTorch's CUDA caching allocator: blocks larger than 128 MB are
+# not split, which limits memory fragmentation. This setting does not select
+# a distributed backend such as NCCL.
+ENV PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:128
+# Create the cache/config directories named by the variables above and make
+# them world-writable.
+# NOTE(review): presumably needed because the container runs as a non-root
+# user at runtime - confirm, and narrow the 777 mode if it is not.
+RUN mkdir -p /app/.cache/huggingface/transformers && \
+    mkdir -p /tmp/matplotlib && \
+    mkdir -p /app/gradio_cached_examples && \
+    chmod -R 777 /app && \
+    chmod -R 777 /tmp/matplotlib
 # Install system dependencies
+# Packages are listed alphabetically, one per line; the apt index is removed
+# in the same layer so it does not end up in the image.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    ca-certificates \
+    curl \
     git \
+    python3-dev \
+    python3-pip \
+    python3-setuptools \
     && rm -rf /var/lib/apt/lists/*
+# All following relative paths resolve against /app
+WORKDIR /app
+# Add a script to check GPU status at startup.
+# The script is written with printf '%s\n', one argument per script line, so
+# the result does not depend on whether the build shell's `echo` interprets
+# "\n" escapes. The single quotes keep ${...} and "$@" literal at build time;
+# they are expanded only when /entrypoint.sh runs in the container.
+# The script ends with `exec "$@"` so the CMD process replaces the wrapper.
+RUN printf '%s\n' \
+    '#!/bin/bash' \
+    'echo "Checking NVIDIA GPU status..."' \
+    'if ! command -v nvidia-smi &> /dev/null; then' \
+    '    echo "WARNING: nvidia-smi command not found. NVIDIA driver might not be installed."' \
+    'else' \
+    '    echo "NVIDIA driver found. Running nvidia-smi:"' \
+    '    nvidia-smi' \
+    'fi' \
+    'echo "Environment variables for GPU:"' \
+    'echo "CUDA_VISIBLE_DEVICES=${CUDA_VISIBLE_DEVICES}"' \
+    'echo "NVIDIA_VISIBLE_DEVICES=${NVIDIA_VISIBLE_DEVICES}"' \
+    'exec "$@"' \
+    > /entrypoint.sh && \
+    chmod +x /entrypoint.sh
 # Copy requirements file
 COPY requirements.txt .
+# Install the pinned Python stack group by group, in a fixed order, to avoid
+# dependency conflicts. `set -e` aborts the layer on the first failing
+# install; pip_install wraps `pip3 install --no-cache-dir` so the pip cache
+# is never written into the image.
+RUN set -e; \
+    pip_install() { pip3 install --no-cache-dir "$@"; }; \
+    # pip itself goes first
+    pip_install --upgrade pip; \
+    # torch / torchvision CUDA 11.8 builds from the PyTorch wheel index
+    pip_install torch==2.0.1+cu118 torchvision==0.15.2+cu118 --extra-index-url https://download.pytorch.org/whl/cu118; \
+    # core numeric / HTTP libraries
+    pip_install numpy==1.24.3 scipy==1.11.3 requests==2.31.0; \
+    # typing-extensions is pinned before the packages that depend on it
+    pip_install typing-extensions==4.10.0; \
+    # Hugging Face libraries
+    pip_install transformers==4.37.2 safetensors==0.4.1 huggingface_hub==0.19.4; \
+    # timm (vision models)
+    pip_install timm==0.9.11; \
+    # nest-asyncio (nested event loops)
+    pip_install nest-asyncio==1.5.8; \
+    # accelerate, then lmdeploy
+    pip_install "accelerate==0.30.0"; \
+    pip_install "lmdeploy==0.5.3"; \
+    # other acceleration libraries
+    pip_install bitsandbytes==0.41.3; \
+    # gradio
+    pip_install gradio==3.38.0; \
+    # remaining utility packages
+    pip_install packaging==23.2 pyyaml==6.0.1 tqdm==4.66.1 openai==1.6.1
+# Bring the application sources into the working directory
 COPY . .
+# Ensure the Gradio example cache and the Hugging Face cache directories
+# exist under the working directory and are world-writable
+RUN mkdir -p gradio_cached_examples .cache/huggingface/transformers && \
+    chmod -R 777 gradio_cached_examples .cache
+# The app is served on port 7860
+EXPOSE 7860
+# Every command is launched through /entrypoint.sh, which reports GPU status
+# and then execs the command it was given
+ENTRYPOINT ["/entrypoint.sh"]
+# Default command: start the application from app.py
+CMD ["python3", "app.py"]