File size: 2,043 Bytes
4f1e963
222d86d
4f1e963
 
 
 
 
0918e19
 
4f1e963
 
 
 
 
 
0918e19
 
4f1e963
 
 
 
 
 
 
 
 
 
 
0918e19
4f1e963
 
 
0918e19
4f1e963
0918e19
4f1e963
 
 
 
0918e19
55eb099
4f1e963
 
 
 
 
 
 
797f976
4f1e963
c02d909
0918e19
4f1e963
 
0918e19
c02d909
e7f7dfb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
FROM python:3.11-slim-bookworm

# Metadata as per https://github.com/opencontainers/image-spec/blob/master/annotations.md
LABEL org.opencontainers.image.authors="Bram Vanroy"
LABEL org.opencontainers.image.title="MAchine Translation Evaluation Online - Demo"

# Avoid prompts from apt
ENV DEBIAN_FRONTEND=noninteractive

# Install dependencies in a single RUN command to reduce image layers
RUN apt-get update && apt-get install -y --no-install-recommends \
    build-essential \
    curl \
    git \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Create a non-root user
RUN useradd -m -u 1000 mateo_user
USER mateo_user
ENV HOME="/home/mateo_user"

# Environment variables
ENV PORT=7860 \
    SERVER="localhost" \
    HF_HUB_ENABLE_HF_TRANSFER=1 \
    PATH="${HOME}/.local/bin:${PATH}" \
    USE_CUDA=false

WORKDIR ${HOME}/mateo

# Clone the repository
RUN git clone https://github.com/BramVanroy/mateo-demo.git
WORKDIR mateo-demo

# Install Python dependencies with conditional torch installation
RUN python -m pip install --no-cache-dir --upgrade pip wheel setuptools \
    && python -m pip install --no-cache-dir torch==2.2.1+cpu -f https://download.pytorch.org/whl/torch \
    && python -m pip install --no-cache-dir --upgrade .

# Pre-download default models
RUN huggingface-cli download bert-base-multilingual-cased model.safetensors tokenizer.json vocab.txt; \
    huggingface-cli download facebook/nllb-200-distilled-600M pytorch_model.bin sentencepiece.bpe.model tokenizer.json; \
    python -c "import comet; from comet import download_model; download_model('Unbabel/wmt22-comet-da')"; \
    python -c "import evaluate; evaluate.load('bleurt', 'BLEURT-20')"

# Expose the port the app runs on
EXPOSE $PORT

# Healthcheck to ensure the service is running
HEALTHCHECK CMD curl --fail http://$SERVER:$PORT/_stcore/health || exit 1

# Set the working directory to the Streamlit app
WORKDIR src/mateo_st

# Launch app
CMD streamlit run 01_🎈_MATEO.py --server.port $PORT --server.enableXsrfProtection false -- --no_cuda