# Container image for the Python endpoint started by handler.py.
#
# NOTE: each instruction must sit on its own line. A line that begins with `#`
# is treated as a comment in its entirety, so instructions placed after a
# comment on the same line are silently ignored.

# Base image providing Python plus PyTorch 2.0.0 with the CUDA 11.7 / cuDNN 8
# runtime libraries. The tag is pinned explicitly for reproducible builds.
FROM pytorch/pytorch:2.0.0-cuda11.7-cudnn8-runtime

# All following relative paths resolve against /app (created if missing).
WORKDIR /app

# Cache directory location exported to the running container.
# Presumably read by pyannote to store downloaded models - confirm in handler.py.
ENV PYANNOTE_CACHE=/app/.cache

# Copy only the dependency manifest first so the (slow) install layer below is
# reused from the build cache whenever application sources change but the
# requirements do not.
# NOTE(review): if requirements.txt references other local files (e.g. `-r`
# includes or `-e .`), copy those here as well.
COPY requirements.txt ./

# Install Python dependencies; --no-cache-dir keeps pip's download cache out
# of the image layer.
RUN pip install --no-cache-dir -r requirements.txt

# Copy the model files and application code into the image. Use a
# .dockerignore to keep .git, local caches and secrets out of the build context.
COPY . /app

# Documents the port the endpoint listens on (if needed). EXPOSE does not
# publish the port by itself; map it with `docker run -p`.
EXPOSE 8080

# NOTE(review): the container runs as root. Consider adding a dedicated user
# and a `USER` instruction once write access to /app/.cache is verified.

# Start the endpoint (adjust if necessary). Exec form makes Python PID 1 so it
# receives SIGTERM from `docker stop` directly.
CMD ["python", "handler.py"]