44 lines
1.1 KiB
Docker
44 lines
1.1 KiB
Docker
FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04
|
|
|
|
# Prevent interactive prompts during package installation
|
|
ENV DEBIAN_FRONTEND=noninteractive
|
|
|
|
# Install Python and system dependencies
|
|
RUN apt-get update && apt-get install -y \
|
|
python3 \
|
|
python3-pip \
|
|
python3-dev \
|
|
libgl1-mesa-glx \
|
|
libglib2.0-0 \
|
|
libsm6 \
|
|
libxext6 \
|
|
libxrender-dev \
|
|
wget \
|
|
&& rm -rf /var/lib/apt/lists/*
|
|
|
|
# Set working directory
|
|
WORKDIR /app
|
|
|
|
# Copy requirements first for better caching
|
|
COPY requirements.txt .
|
|
|
|
# Install Python dependencies (with pip cache for faster rebuilds)
|
|
RUN --mount=type=cache,target=/root/.cache/pip \
|
|
pip3 install -r requirements.txt
|
|
|
|
# Download YOLO11s model (small, efficient)
|
|
RUN python3 -c "from ultralytics import YOLO; YOLO('yolo11s.pt')"
|
|
|
|
# Copy application code
|
|
COPY main.py .
|
|
|
|
# Expose port
|
|
EXPOSE 5002
|
|
|
|
# Health check
|
|
HEALTHCHECK --interval=30s --timeout=10s --start-period=60s --retries=3 \
|
|
CMD python3 -c "import urllib.request; urllib.request.urlopen('http://localhost:5002/health')" || exit 1
|
|
|
|
# Run the service
|
|
CMD ["python3", "-m", "uvicorn", "main:app", "--host", "0.0.0.0", "--port", "5002"]
|