OI / Dockerfile
JPBianchi's picture
added Linux apps
301e370
FROM python:3.10-slim
ENV PYTHONDONTWRITEBYTECODE 1
# ^ saves space by not writing .pyc files
ENV PYTHONUNBUFFERED 1
# ^ ensures that the output from the Python app is sent straight to the terminal without being buffered -> real time monitoring
RUN apt-get update && apt-get install -y \
unzip \
curl \
wget \
git git-lfs \
bash \
&& rm -rf /var/lib/apt/lists/*2
ENV ENVIRONMENT=dev
COPY ./app /app
WORKDIR .
RUN mkdir -p data
RUN mkdir -p assets/data
RUN pip install --no-cache-dir --upgrade -r app/requirements.txt
# ^ no caching of the packages to save space
# pip install guardrails-ai first
# https://huggingface.co/docs/hub/spaces-sdks-docker#secrets
RUN --mount=type=secret,id=GUARDRAILS_TOKEN,mode=0444,required=true \
guardrails configure --token $(cat /run/secrets/GUARDRAILS_TOKEN) --no-metrics True
RUN guardrails hub install hub://guardrails/regex_match
RUN guardrails hub install hub://guardrails/toxic_language
RUN guardrails hub install hub://guardrails/detect_pii
RUN guardrails hub install hub://guardrails/qa_relevance_llm_eval
# RUN python -c "import nltk; nltk.download('stopwords')"
# ^ to fix runtime error, see https://github.com/run-llama/llama_index/issues/10681
# it didn't work, I had to do chmod below (as also suggested in the article)
RUN chmod -R 777 /usr/local/lib/python3.10/site-packages/llama_index/legacy/_static/nltk_cache
ENV TRANSFORMERS_CACHE=/usr/local/lib/python3.10/site-packages/llama_index/legacy/_static/nltk_cache
# ^ not elegant but it works
# HF warning says that TRANSFORMERS_CACHE will be deprecated in transformers v5, and advise to use HF_HOME
CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "7860"]