File size: 885 Bytes
253fe6a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 |
# Docker Compose stack: an HAProxy front end published on host port 7070 and
# two text-generation-inference containers (model1, model2), both launched
# with the same google/flan-t5-small configuration.
#
# NOTE(review): recent Docker Compose releases ignore the top-level `version`
# key; it is kept for older tooling. Confirm the service-level resource limits
# below (`cpus`, `mem_limit`) are accepted by the Compose release in use.
version: '3.8'

services:
  # Front end. The short `depends_on` form only orders container start-up;
  # it does not wait for the model servers to be ready to serve requests.
  haproxy:
    # NOTE(review): `latest` is a floating tag; consider pinning a release so
    # redeployments are reproducible.
    image: haproxy:latest
    volumes:
      - ./haproxy.cfg:/usr/local/etc/haproxy/haproxy.cfg:ro
    ports:
      - "7070:80"
    depends_on:
      - model1
      - model2

  model1:
    image: ghcr.io/huggingface/text-generation-inference:1.0
    command: --model-id google/flan-t5-small --disable-custom-kernels --dtype bfloat16
    environment:
      # Mapping form with interpolation: the token is read from the host
      # environment (or an .env file) and defaults to empty. The previous
      # list entry `KEY=""` passed the two quote characters as the value.
      HUGGING_FACE_HUB_TOKEN: ${HUGGING_FACE_HUB_TOKEN:-}
    volumes:
      - ./data:/data
    cpus: '16'
    # NOTE(review): model2 is pinned to the same cores (0-15), so the two
    # services share CPUs. Confirm this is intended.
    cpuset: '0-15'
    mem_limit: 48g
    # NOTE(review): privileged mode grants broad host access; confirm it is
    # actually required by this workload.
    privileged: true

  model2:
    image: ghcr.io/huggingface/text-generation-inference:1.0
    command: --model-id google/flan-t5-small --disable-custom-kernels --dtype bfloat16
    environment:
      # Same token handling as model1: taken from the host environment,
      # empty when unset.
      HUGGING_FACE_HUB_TOKEN: ${HUGGING_FACE_HUB_TOKEN:-}
    volumes:
      - ./data:/data
    cpus: '16'
    # NOTE(review): identical core range to model1 (0-15). Confirm intended.
    cpuset: '0-15'
    mem_limit: 48g
    # NOTE(review): privileged mode grants broad host access; confirm it is
    # actually required by this workload.
    privileged: true

# NOTE(review): no service shown here mounts this named volume; the model
# services bind-mount the ./data directory instead. Kept unchanged in case
# other tooling relies on the declaration.
volumes:
  data:
    external: true
|