# syntax=docker/dockerfile:1

# Image for a Python 3.10 application started with `python app.py`.
# Installs Tesseract OCR, Node.js, Playwright's Chromium and a pre-downloaded
# tokenizer, then drops privileges to a non-root user (uid 1000).

# Pinned to the bookworm variant so the apt package names below stay valid
# when the floating `3.10-slim` tag moves to a newer Debian release.
FROM python:3.10-slim-bookworm

# System packages, one per line and sorted for easy diffing.
# - ca-certificates is listed explicitly because --no-install-recommends would
#   otherwise not pull it in for curl/git.
# - libgl1 replaces libgl1-mesa-glx, which is not available on bookworm.
# - tesseract-ocr-ind is the Indonesian language data for Tesseract.
# NOTE(review): software-properties-common is not used by anything in this
# file; kept in case the application relies on it - confirm and drop if not.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        curl \
        git \
        libgl1 \
        libglib2.0-0 \
        software-properties-common \
        tesseract-ocr \
        tesseract-ocr-ind \
    && rm -rf /var/lib/apt/lists/*

# Node.js from NodeSource. The setup script is downloaded to a file first so a
# failed download (curl -f) stops the build instead of piping an error page or
# empty input into bash.
ARG NODE_MAJOR=18
RUN curl -fsSL "https://deb.nodesource.com/setup_${NODE_MAJOR}.x" -o /tmp/nodesource_setup.sh \
    && bash /tmp/nodesource_setup.sh \
    && apt-get install -y --no-install-recommends nodejs \
    && rm -f /tmp/nodesource_setup.sh \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Non-root runtime user plus the cache directories it needs to write to.
# Ownership alone is sufficient because the container runs as this user, so
# the directories are not made world-writable.
RUN useradd -m -u 1000 user \
    && mkdir -p /.cache /home/user/.cache \
    && chown -R user:user /app /.cache /home/user/.cache

# Python dependencies are installed before the application source is copied so
# this layer is reused until requirements.txt itself changes.
COPY --chown=user:user requirements.txt /app/
RUN pip install --no-cache-dir -r requirements.txt

# Playwright stores browsers under the installing user's home by default. The
# install runs as root, so without a shared location the runtime user could
# not find Chromium. Install into a fixed path and hand it to the runtime user.
ENV PLAYWRIGHT_BROWSERS_PATH=/ms-playwright
RUN pip install --no-cache-dir playwright \
    && playwright install chromium \
    && playwright install-deps chromium \
    && rm -rf /var/lib/apt/lists/* \
    && chown -R user:user "${PLAYWRIGHT_BROWSERS_PATH}"

# Pre-download the tokenizer at build time into /app/tokenizers.
# NOTE(review): assumes `transformers` is provided by requirements.txt - confirm.
RUN mkdir -p /app/tokenizers/indobert-base-p1 \
    && python -c "from transformers import AutoTokenizer; AutoTokenizer.from_pretrained('indobenchmark/indobert-base-p1', cache_dir='/app/tokenizers')" \
    && chown -R user:user /app/tokenizers

# Application source, owned by the runtime user at copy time (avoids a second
# layer that only rewrites ownership).
COPY --chown=user:user . /app/

# Writable working directories for the application; their contents, if any,
# were already given the right owner by the COPY above.
RUN mkdir -p screenshots models \
    && chown user:user screenshots models

# Documentation only: the port the application is expected to listen on.
EXPOSE 7860

USER user

CMD ["python", "app.py"]