Add Dockerfile with CUDA 12.2 support for audio-chat

2026-05-01 13:54:57 +00:00
parent e2d3cbe783
commit df2a97b85a
1 changed files with 46 additions and 0 deletions
--- a/46
+++ b/46
@@ -0,0 +1,46 @@
+ARG BASE_IMAGE=nvidia/cuda:12.2.2-runtime-ubuntu22.04
+
+FROM ${BASE_IMAGE}
+
+# Set environment variables
+ENV PYTHONUNBUFFERED=1 \
+    PYTHONDONTWRITEBYTECODE=1 \
+    DEBIAN_FRONTEND=noninteractive \
+    MODEL_CACHE_DIR=/models
+
+# Install Python and system dependencies
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    python3.10 \
+    python3.10-venv \
+    python3-pip \
+    build-essential \
+    git \
+    curl \
+    wget \
+    libsndfile1 \
+    portaudio19-dev \
+    ffmpeg \
+    && rm -rf /var/lib/apt/lists/*
+
+# Set up Python virtual environment
+WORKDIR /app
+COPY requirements.txt .
+RUN pip install --no-cache-dir --upgrade pip && \
+    pip install --no-cache-dir -r requirements.txt
+
+# Copy application code
+COPY . .
+
+# Create model cache directory
+RUN mkdir -p ${MODEL_CACHE_DIR}
+
+# Set environment variables for models
+ENV TRANSFORMERS_CACHE=${MODEL_CACHE_DIR} \
+    HF_HOME=${MODEL_CACHE_DIR} \
+    PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+
+# Expose WebSocket port
+EXPOSE 8000
+
+# Run the application
+CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]