Add Dockerfile with CUDA 12.2 support for audio-chat

2026-05-01 13:54:57 +00:00
parent e2d3cbe783
commit df2a97b85a
1 changed files with 46 additions and 0 deletions
--- a/46
+++ b/46
@@ -0,0 +1,46 @@
 # Base image for the single build stage. It can be swapped at build time with
 # `--build-arg BASE_IMAGE=...`; the default is the CUDA 12.2.2 runtime image
 # on Ubuntu 22.04.
 ARG BASE_IMAGE=nvidia/cuda:12.2.2-runtime-ubuntu22.04
 FROM $BASE_IMAGE
 # Runtime environment:
 #   PYTHONUNBUFFERED=1        - Python writes stdout/stderr unbuffered, so log
 #                               lines show up in `docker logs` immediately.
 #   PYTHONDONTWRITEBYTECODE=1 - Python does not write .pyc files.
 #   MODEL_CACHE_DIR           - directory that later instructions create and
 #                               point the model caches at.
 ENV PYTHONUNBUFFERED=1 \
     PYTHONDONTWRITEBYTECODE=1 \
     MODEL_CACHE_DIR=/models
 # Build-time only: keeps apt/debconf from prompting during package installs.
 # Declared as ARG (not ENV) so it is visible to the RUN steps of this stage
 # but is not baked into the environment of the running container.
 ARG DEBIAN_FRONTEND=noninteractive
 # OS-level dependencies: the Python 3.10 interpreter with pip and venv
 # support, a compiler toolchain, download/VCS tools, and the audio libraries
 # (libsndfile, PortAudio headers, ffmpeg). The package list is kept in
 # alphabetical order for easy diffing. The apt package index is removed in
 # the same layer so it does not end up in the image.
 RUN apt-get update \
     && apt-get install -y --no-install-recommends \
         build-essential \
         curl \
         ffmpeg \
         git \
         libsndfile1 \
         portaudio19-dev \
         python3-pip \
         python3.10 \
         python3.10-venv \
         wget \
     && rm -rf /var/lib/apt/lists/*
 # Set up Python virtual environment.
 # The venv is created with the python3.10 interpreter installed above, and
 # its bin/ directory is put first on PATH so that `python`, `pip` and any
 # console scripts installed from requirements.txt resolve to the venv for
 # every later instruction and at container runtime. This keeps the
 # distro-managed pip in /usr untouched.
 ENV VIRTUAL_ENV=/opt/venv
 RUN python3.10 -m venv ${VIRTUAL_ENV}
 ENV PATH=${VIRTUAL_ENV}/bin:${PATH}
 WORKDIR /app
 # requirements.txt is copied on its own, before the application source, so
 # the dependency layer below is rebuilt only when the requirements change.
 COPY requirements.txt .
 RUN python -m pip install --no-cache-dir --upgrade pip && \
     python -m pip install --no-cache-dir -r requirements.txt
 # Create an unprivileged account to run the service, and give it ownership
 # of the application directory and of the model cache directory so the
 # process can write to both without being root. Fixed numeric IDs let
 # orchestrators verify that the container does not run as root.
 # NOTE(review): if a host directory is bind-mounted over ${MODEL_CACHE_DIR},
 # it must be writable by UID 10001 - confirm against the deployment setup.
 RUN groupadd --system --gid 10001 app && \
     useradd --system --uid 10001 --gid app --create-home app && \
     mkdir -p ${MODEL_CACHE_DIR} && \
     chown app:app /app ${MODEL_CACHE_DIR}
 # Copy application code, owned by the unprivileged account
 COPY --chown=app:app . .
 # Everything from here on (including the container's main process) runs as
 # the unprivileged user; no later instruction needs root.
 USER app
 # Point the Hugging Face caches at the model cache directory.
 # NOTE(review): recent transformers releases warn that TRANSFORMERS_CACHE is
 # deprecated in favour of HF_HOME - confirm against the pinned version before
 # dropping it, since removing it changes where models are stored.
 ENV HF_HOME=${MODEL_CACHE_DIR}
 ENV TRANSFORMERS_CACHE=${MODEL_CACHE_DIR}
 # Setting read by PyTorch's CUDA memory allocator.
 ENV PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
 # Document the port the server listens on (EXPOSE does not publish it; use
 # `-p 8000:8000` or the orchestrator's port mapping).
 EXPOSE 8000/tcp
 # Default command: serve the `app` object from the `main` module with
 # uvicorn on all interfaces, port 8000. Exec (JSON) form, so no shell wraps
 # the process.
 CMD ["uvicorn", "main:app", \
      "--host", "0.0.0.0", \
      "--port", "8000"]