# Base image: PyTorch 2.0.0 runtime with CUDA 11.7 / cuDNN 8 (tag pinned
# explicitly so rebuilds do not silently pick up a different toolchain).
FROM pytorch/pytorch:2.0.0-cuda11.7-cudnn8-runtime

# All application files live under /app; WORKDIR creates it if missing.
WORKDIR /app

# Location that PYANNOTE_CACHE points at; it sits inside /app so it must be
# writable by the runtime user created below.
ENV PYANNOTE_CACHE=/app/.cache

# Create an unprivileged user with a stable numeric UID (useful for runtimes
# that verify runAsNonRoot) and hand it ownership of /app and the cache
# directory. A home directory is created so libraries that default to
# ~/.cache have somewhere writable.
RUN groupadd --system --gid 10001 app \
    && useradd --system --uid 10001 --gid app --create-home app \
    && mkdir -p /app/.cache \
    && chown -R app:app /app

# Install dependencies BEFORE copying the rest of the source: this layer is
# then reused from cache until requirements.txt itself changes, instead of
# being rebuilt on every source edit.
COPY --chown=app:app requirements.txt ./
RUN pip install --no-cache-dir -r requirements.txt

# Copy the application / model files (most frequently changing layer last).
# Pair this with a .dockerignore to keep .git, local caches and secrets out
# of the build context.
COPY --chown=app:app . /app

# Drop root privileges for the running container.
USER app

# Document the port the endpoint listens on (EXPOSE does not publish it).
EXPOSE 8080

# Start the endpoint; exec form so the Python process is PID 1 and receives
# SIGTERM directly from `docker stop`.
CMD ["python", "handler.py"]