File size: 885 Bytes
253fe6a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
# Compose Specification file (Docker Compose v2, or docker-compose >= 1.27).
# The top-level `version` key is intentionally omitted: it is obsolete in the
# Compose Specification (Compose v2 ignores it and prints a warning), and the
# service-level `cpus`, `cpuset` and `mem_limit` keys used below are not part
# of the legacy 3.x file format that this file previously declared.

services:
  # HAProxy front end: the only service in this file that publishes a host
  # port. Presumably proxies to model1/model2 as configured in haproxy.cfg
  # (not shown here) — verify against that file.
  haproxy:
    # NOTE(review): `latest` is a floating tag; consider pinning a release.
    image: haproxy:latest
    # Start only after both model containers have been started
    # (equivalent to the short list form of depends_on).
    depends_on:
      model1:
        condition: service_started
      model2:
        condition: service_started
    # Host port 7070 -> container port 80 (long form of "7070:80").
    ports:
      - target: 80
        published: 7070
        protocol: tcp
    # Local HAProxy configuration, mounted read-only.
    volumes:
      - ./haproxy.cfg:/usr/local/etc/haproxy/haproxy.cfg:ro

  # Text Generation Inference container serving google/flan-t5-small.
  model1:
    image: ghcr.io/huggingface/text-generation-inference:1.0
    command: --model-id google/flan-t5-small --disable-custom-kernels --dtype bfloat16
    environment:
      # Mapping form with interpolation: the token is read from the host
      # environment (or .env file) and defaults to an empty string when unset.
      # The previous list entry `HUGGING_FACE_HUB_TOKEN=""` passed the two
      # quote characters through as the literal value, because list-form
      # entries are split on the first `=` and are not unquoted.
      HUGGING_FACE_HUB_TOKEN: "${HUGGING_FACE_HUB_TOKEN:-}"
    volumes:
      # Bind mount of the local ./data directory at /data; model2 mounts the
      # same host directory.
      - ./data:/data
    cpus: '16'
    # NOTE(review): model2 is pinned to the same cores (0-15), so both
    # containers compete for the same CPUs — confirm the overlap is intended.
    cpuset: '0-15'
    mem_limit: 48g
    # NOTE(review): privileged mode gives the container broad access to the
    # host; confirm it is actually required for this service.
    privileged: true

  # Second Text Generation Inference container serving google/flan-t5-small.
  model2:
    image: ghcr.io/huggingface/text-generation-inference:1.0
    command: --model-id google/flan-t5-small --disable-custom-kernels --dtype bfloat16
    environment:
      # Mapping form with interpolation: the token is read from the host
      # environment (or .env file) and defaults to an empty string when unset.
      # The previous list entry `HUGGING_FACE_HUB_TOKEN=""` passed the two
      # quote characters through as the literal value, because list-form
      # entries are split on the first `=` and are not unquoted.
      HUGGING_FACE_HUB_TOKEN: "${HUGGING_FACE_HUB_TOKEN:-}"
    volumes:
      # Bind mount of the local ./data directory at /data; model1 mounts the
      # same host directory.
      - ./data:/data
    cpus: '16'
    # NOTE(review): model1 is pinned to the same cores (0-15), so both
    # containers compete for the same CPUs — confirm the overlap is intended.
    cpuset: '0-15'
    mem_limit: 48g
    # NOTE(review): privileged mode gives the container broad access to the
    # host; confirm it is actually required for this service.
    privileged: true

# Declares a named volume `data` that Compose expects to already exist
# (external: true), i.e. Compose will not create it.
# NOTE(review): none of the services visible in this file reference this
# named volume — they bind-mount the host directory ./data instead. Confirm
# whether the services were meant to use `data:/data`, or whether this
# declaration can be dropped.
volumes:
  data:
    external: true