forked from fauxpilot/fauxpilot
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdocker-compose.yaml
More file actions
32 lines (32 loc) · 868 Bytes
/
docker-compose.yaml
File metadata and controls
32 lines (32 loc) · 868 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Compose definition for two services: `triton` (the model server) and
# `copilot_proxy` (an HTTP front end built from this repository).
#
# ${GPUS}, ${MODEL_DIR} and ${API_EXTERNAL_PORT} are substituted by Compose.
# NOTE(review): presumably they are supplied by the `.env` file that
# ./setup.sh generates - confirm before running without it.
version: '3.3'
services:
  triton:
    image: moyix/triton_with_ft:22.09
    # Start tritonserver under mpirun (single process), restricted to the GPUs
    # listed in ${GPUS}, loading models from /model (the volume mounted below).
    command: bash -c "CUDA_VISIBLE_DEVICES=${GPUS} mpirun -n 1 --allow-run-as-root /opt/tritonserver/bin/tritonserver --model-repository=/model"
    shm_size: '2gb'
    volumes:
      # Host model directory mounted at the path passed to --model-repository.
      - ${MODEL_DIR}:/model
    ports:
      # host:container mappings; quoted so they are always read as strings.
      - "8000:8000"
      - "8001:8001"
      - "8002:8002"
    deploy:
      resources:
        reservations:
          devices:
            # One device reservation: all GPUs exposed by the nvidia driver.
            - driver: nvidia
              count: all
              capabilities: [gpu]
  copilot_proxy:
    # For dockerhub version
    # image: moyix/copilot_proxy:latest
    # command: python3 -m flask run --host=0.0.0.0 --port=5000
    # For local build
    build:
      context: .
      dockerfile: copilot_proxy/Dockerfile
    env_file:
      # Automatically created via ./setup.sh
      - .env
    ports:
      # Container port 5000 is published on the host port ${API_EXTERNAL_PORT}.
      - "${API_EXTERNAL_PORT}:5000"