-
Notifications
You must be signed in to change notification settings - Fork 0
/
docker-compose.yaml
59 lines (59 loc) · 1.22 KB
/
docker-compose.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
# Compose stack with four services: `main`, `inference-service`, `webapp`,
# and a Triton Inference Server (`triton`) that needs an NVIDIA GPU.
version: "3.5"

services:
  # Built from the Dockerfile at the repository root.
  main:
    build:
      context: ./
      dockerfile: Dockerfile
    ports:
      # host 8004 -> container 8000
      - "8004:8000"
    depends_on:
      - inference-service
      - triton
      # - webapp

  # Built from ./inference_service; started after `triton`.
  inference-service:
    build:
      context: ./inference_service
    environment:
      - AWS_PROFILE=default
    volumes:
      # Host AWS config/credentials directory, mounted read-only.
      - ~/.aws/:/root/.aws:ro
    ports:
      # host 8005 -> container 8000
      - "8005:8000"
    depends_on:
      - triton

  # Built from ./webapp.
  webapp:
    build:
      context: ./webapp
    environment:
      - AWS_PROFILE=default
    volumes:
      # Host AWS config/credentials directory, mounted read-only.
      - ~/.aws/:/root/.aws:ro
    ports:
      # host 8006 -> container 8080
      - "8006:8080"

  # Triton Inference Server; the model repository is read from S3.
  triton:
    image: nvcr.io/nvidia/tritonserver:22.02-py3
    runtime: nvidia
    # Presumably supplies the AWS settings needed to reach the S3 model
    # repository -- the file's contents are not visible here; confirm.
    env_file:
      - .aws.env
    ports:
      # port 8000: HTTP, port 8001: gRPC, port 8002: metrics service
      - "8000:8000"
      - "8001:8001"
      - "8002:8002"
    command:
      - "tritonserver"
      - "--model-repository=s3://aerial-detection-mlops4/model/Visdrone/Yolov7/triton-deploy/models/"
      - "--strict-model-config=false"
    shm_size: 2g
    ulimits:
      # -1 means unlimited locked memory.
      memlock: -1
      # 67108864 bytes = 64 MiB of stack.
      stack: 67108864
    deploy:
      resources:
        reservations:
          devices:
            # Reserve one NVIDIA GPU for this container.
            - driver: nvidia
              count: 1
              capabilities: [gpu]