Spaces:
Runtime error
Runtime error
| FROM nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04 | |
| # Set environment variables | |
| ENV DEBIAN_FRONTEND=noninteractive | |
| ENV PYTHONUNBUFFERED=1 | |
| ENV HF_HOME=/app/.cache/huggingface | |
| ENV TRANSFORMERS_CACHE=/app/.cache/huggingface/transformers | |
| ENV MPLCONFIGDIR=/tmp/matplotlib | |
| # Force PyTorch to use the NCCl backend | |
| ENV PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:128 | |
| # Create necessary directories with proper permissions | |
| RUN mkdir -p /app/.cache/huggingface/transformers && \ | |
| mkdir -p /tmp/matplotlib && \ | |
| mkdir -p /app/gradio_cached_examples && \ | |
| chmod -R 777 /app && \ | |
| chmod -R 777 /tmp/matplotlib | |
| # Install system dependencies | |
| RUN apt-get update && apt-get install -y --no-install-recommends \ | |
| build-essential \ | |
| git \ | |
| curl \ | |
| ca-certificates \ | |
| python3-pip \ | |
| python3-dev \ | |
| python3-setuptools \ | |
| && rm -rf /var/lib/apt/lists/* | |
| # Create a working directory | |
| WORKDIR /app | |
| # Add a script to check GPU status at startup | |
| RUN echo '#!/bin/bash \n\ | |
| echo "Checking NVIDIA GPU status..." \n\ | |
| if ! command -v nvidia-smi &> /dev/null; then \n\ | |
| echo "WARNING: nvidia-smi command not found. NVIDIA driver might not be installed." \n\ | |
| else \n\ | |
| echo "NVIDIA driver found. Running nvidia-smi:" \n\ | |
| nvidia-smi \n\ | |
| fi \n\ | |
| echo "Environment variables for GPU:" \n\ | |
| echo "CUDA_VISIBLE_DEVICES=${CUDA_VISIBLE_DEVICES}" \n\ | |
| echo "NVIDIA_VISIBLE_DEVICES=${NVIDIA_VISIBLE_DEVICES}" \n\ | |
| exec "$@"' > /entrypoint.sh && \ | |
| chmod +x /entrypoint.sh | |
| # Copy requirements file | |
| COPY requirements.txt . | |
| # Upgrade pip and install dependencies in specific order to avoid conflicts | |
| RUN pip3 install --no-cache-dir --upgrade pip && \ | |
| # Install torch and torchvision first with CUDA support | |
| pip3 install --no-cache-dir torch==2.0.1+cu118 torchvision==0.15.2+cu118 --extra-index-url https://download.pytorch.org/whl/cu118 && \ | |
| # Install core dependencies | |
| pip3 install --no-cache-dir numpy==1.24.3 scipy==1.11.3 requests==2.31.0 && \ | |
| # Install typing-extensions first to ensure proper version for other packages | |
| pip3 install --no-cache-dir typing-extensions==4.10.0 && \ | |
| # Install huggingface dependencies | |
| pip3 install --no-cache-dir transformers==4.37.2 safetensors==0.4.1 huggingface_hub==0.19.4 && \ | |
| # Install timm for vision models | |
| pip3 install --no-cache-dir timm==0.9.11 && \ | |
| # Install nest-asyncio for handling nested event loops | |
| pip3 install --no-cache-dir nest-asyncio==1.5.8 && \ | |
| # Install lmdeploy and its dependencies first | |
| pip3 install --no-cache-dir "accelerate==0.30.0" && \ | |
| pip3 install --no-cache-dir "lmdeploy==0.5.3" && \ | |
| # Install other acceleration libraries | |
| pip3 install --no-cache-dir bitsandbytes==0.41.3 && \ | |
| # Install gradio | |
| pip3 install --no-cache-dir gradio==3.38.0 && \ | |
| # Install any remaining requirements | |
| pip3 install --no-cache-dir packaging==23.2 pyyaml==6.0.1 tqdm==4.66.1 openai==1.6.1 | |
| # Copy the application files | |
| COPY . . | |
| # Make sure the runtime directories exist and have proper permissions | |
| RUN mkdir -p gradio_cached_examples && \ | |
| chmod -R 777 gradio_cached_examples && \ | |
| mkdir -p .cache/huggingface/transformers && \ | |
| chmod -R 777 .cache | |
| # Make port 7860 available for the app | |
| EXPOSE 7860 | |
| # Use our entrypoint script to check GPU status before starting the app | |
| ENTRYPOINT ["/entrypoint.sh"] | |
| # Start the application - FIXED to point to the correct file | |
| CMD ["python3", "app.py"] | |