Add Dockerfile with CUDA 12.2 support for audio-chat
This commit is contained in:
46
Dockerfile
Normal file
46
Dockerfile
Normal file
@@ -0,0 +1,46 @@
|
|||||||
|
ARG BASE_IMAGE=nvidia/cuda:12.2.2-runtime-ubuntu22.04
|
||||||
|
|
||||||
|
FROM ${BASE_IMAGE}
|
||||||
|
|
||||||
|
# Set environment variables
|
||||||
|
ENV PYTHONUNBUFFERED=1 \
|
||||||
|
PYTHONDONTWRITEBYTECODE=1 \
|
||||||
|
DEBIAN_FRONTEND=noninteractive \
|
||||||
|
MODEL_CACHE_DIR=/models
|
||||||
|
|
||||||
|
# Install Python and system dependencies
|
||||||
|
RUN apt-get update && apt-get install -y --no-install-recommends \
|
||||||
|
python3.10 \
|
||||||
|
python3.10-venv \
|
||||||
|
python3-pip \
|
||||||
|
build-essential \
|
||||||
|
git \
|
||||||
|
curl \
|
||||||
|
wget \
|
||||||
|
libsndfile1 \
|
||||||
|
portaudio19-dev \
|
||||||
|
ffmpeg \
|
||||||
|
&& rm -rf /var/lib/apt/lists/*
|
||||||
|
|
||||||
|
# Set up Python virtual environment
|
||||||
|
WORKDIR /app
|
||||||
|
COPY requirements.txt .
|
||||||
|
RUN pip install --no-cache-dir --upgrade pip && \
|
||||||
|
pip install --no-cache-dir -r requirements.txt
|
||||||
|
|
||||||
|
# Copy application code
|
||||||
|
COPY . .
|
||||||
|
|
||||||
|
# Create model cache directory
|
||||||
|
RUN mkdir -p ${MODEL_CACHE_DIR}
|
||||||
|
|
||||||
|
# Set environment variables for models
|
||||||
|
ENV TRANSFORMERS_CACHE=${MODEL_CACHE_DIR} \
|
||||||
|
HF_HOME=${MODEL_CACHE_DIR} \
|
||||||
|
PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
|
||||||
|
|
||||||
|
# Expose WebSocket port
|
||||||
|
EXPOSE 8000
|
||||||
|
|
||||||
|
# Run the application
|
||||||
|
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]
|
||||||
Reference in New Issue
Block a user