# llama2-docker-compose / docker-compose_flant5.yaml
# Arun Kumar Tiwary
# Upload folder using huggingface_hub
# 253fe6a verified
# Compose stack: one HAProxy front end plus two text-generation-inference
# (TGI) containers, both launched with --model-id google/flan-t5-small.

# NOTE(review): `version` is obsolete under the Compose Specification and
# recent Docker Compose releases ignore it; kept here for older tooling.
version: '3.8'

services:
  # Front end: host port 7070 is published to container port 80, and the
  # local ./haproxy.cfg is mounted read-only as the HAProxy configuration.
  # depends_on starts both model services before this one.
  # NOTE(review): `latest` is an unpinned tag — consider pinning a version.
  haproxy:
    image: haproxy:latest
    volumes:
      - ./haproxy.cfg:/usr/local/etc/haproxy/haproxy.cfg:ro
    ports:
      - "7070:80"
    depends_on:
      - model1
      - model2

  # NOTE(review): model1 and model2 are both pinned to CPUs 0-15 via
  # `cpuset`, so the two containers share the same cores — confirm that
  # this is intended for the target host.
  # NOTE(review): both run with `privileged: true`; confirm it is required.

  # First TGI replica. No host port is published for it.
  model1:
    image: ghcr.io/huggingface/text-generation-inference:1.0
    command: --model-id google/flan-t5-small --disable-custom-kernels --dtype bfloat16
    environment:
      # Key-only entry: the value is taken from the environment of the
      # machine running Compose. Do not write KEY="" in list syntax — the
      # quote characters become part of the value.
      - HUGGING_FACE_HUB_TOKEN
    volumes:
      # Bind mount of the local ./data directory at /data in the container.
      - ./data:/data
    cpus: '16'
    cpuset: '0-15'
    mem_limit: 48g
    privileged: true

  # Second TGI replica, configured identically to model1.
  model2:
    image: ghcr.io/huggingface/text-generation-inference:1.0
    command: --model-id google/flan-t5-small --disable-custom-kernels --dtype bfloat16
    environment:
      # Key-only entry: the value is taken from the environment of the
      # machine running Compose. Do not write KEY="" in list syntax — the
      # quote characters become part of the value.
      - HUGGING_FACE_HUB_TOKEN
    volumes:
      # Bind mount of the local ./data directory at /data in the container.
      - ./data:/data
    cpus: '16'
    cpuset: '0-15'
    mem_limit: 48g
    privileged: true

# NOTE(review): no service in this file mounts the named volume `data`; the
# model services bind-mount the ./data directory instead. Confirm whether
# this external volume declaration is still needed.
volumes:
  data:
    external: true