Add Dockerfile with CUDA 12.2 support for audio-chat

This commit is contained in:
root
2026-05-01 13:54:57 +00:00
parent e2d3cbe783
commit df2a97b85a

46
Dockerfile Normal file
View File

@@ -0,0 +1,46 @@
ARG BASE_IMAGE=nvidia/cuda:12.2.2-runtime-ubuntu22.04
FROM ${BASE_IMAGE}
# Set environment variables
ENV PYTHONUNBUFFERED=1 \
PYTHONDONTWRITEBYTECODE=1 \
DEBIAN_FRONTEND=noninteractive \
MODEL_CACHE_DIR=/models
# Install Python and system dependencies
RUN apt-get update && apt-get install -y --no-install-recommends \
python3.10 \
python3.10-venv \
python3-pip \
build-essential \
git \
curl \
wget \
libsndfile1 \
portaudio19-dev \
ffmpeg \
&& rm -rf /var/lib/apt/lists/*
# Set up Python virtual environment
WORKDIR /app
COPY requirements.txt .
RUN pip install --no-cache-dir --upgrade pip && \
pip install --no-cache-dir -r requirements.txt
# Copy application code
COPY . .
# Create model cache directory
RUN mkdir -p ${MODEL_CACHE_DIR}
# Set environment variables for models
ENV TRANSFORMERS_CACHE=${MODEL_CACHE_DIR} \
HF_HOME=${MODEL_CACHE_DIR} \
PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
# Expose WebSocket port
EXPOSE 8000
# Run the application
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]