# CUDA 12.1 runtime image (Ubuntu 22.04) serving the ASGI app `app:app` with uvicorn.
FROM nvidia/cuda:12.1.1-runtime-ubuntu22.04

# OS-level tooling plus the Python interpreter and pip.
# - DEBIAN_FRONTEND is set inline so it does not leak into the runtime environment.
# - --no-install-recommends keeps the layer small; ca-certificates is therefore
#   listed explicitly so git/curl/wget can still verify HTTPS endpoints.
# - NOTE(review): recommends such as build-essential/python3-dev are no longer
#   pulled in; add them here if a requirement has to be compiled from source.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        git \
        python3 \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Dedicated unprivileged account so the service does not run as root.
# UID 1000 is the conventional first regular UID; presumably it matches the UID
# the hosting platform runs containers as - confirm for the deployment target.
RUN useradd --create-home --uid 1000 appuser

WORKDIR /app

# Install Python dependencies before copying the sources so this layer stays
# cached until requirements.txt itself changes.
COPY requirements.txt /app/requirements.txt
RUN python3 -m pip install --no-cache-dir -r requirements.txt

# Application sources, owned by the runtime user.
COPY --chown=appuser:appuser . /app

# Writable model/cache directory. Ownership is handed to the runtime user
# instead of making the tree world-writable (chmod 777). /app is chowned as
# well because WORKDIR created it as root.
# If the container is started under a different UID (docker run --user ...),
# mount a writable volume at /app/.cache.
RUN mkdir -p /app/.cache && chown appuser:appuser /app /app/.cache

# All three cache variables point at the same directory.
# TRANSFORMERS_CACHE is presumably kept for older transformers releases -
# confirm whether it is still needed.
# PORT is exported for code that reads it; the CMD below does not expand it
# (exec form performs no variable substitution) and uses 7860 directly.
ENV HF_HOME=/app/.cache \
    TRANSFORMERS_CACHE=/app/.cache \
    HF_HUB_CACHE=/app/.cache \
    PORT=7860

# Documents the port uvicorn listens on; does not publish it by itself.
EXPOSE 7860

USER appuser

# Exec form: uvicorn is PID 1 and receives SIGTERM from `docker stop` directly.
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]