-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathdocker-compose.yml
55 lines (53 loc) · 1.33 KB
/
docker-compose.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
# Compose stack with two services: `web` (built from ./fastapi_server and
# started with uvicorn) and `triton` (built from ./triton_server and started
# with tritonserver). `web` is started after `triton`.
version: '3.8'

services:
  web:
    build: ./fastapi_server
    restart: always
    # Folded scalar: the lines below are joined with single spaces into one
    # command string.
    command: >-
      uvicorn main:api
      --host 0.0.0.0
      --port 8008
      --log-level info
      --root-path /api
      --workers 32
    # Names listed without a value are passed through from the environment
    # Compose itself runs in (shell or .env file); nothing is set here.
    environment:
      - STANDARD_SAMPLING_RATE
      - STANDARD_BATCH_SIZE
      - INFERENCE_SERVER_HOST
      - DEFAULT_API_KEY_VALUE
      - ENABLE_LOGGING
      - AZURE_STORAGE_ACCESS_KEY
      - AZURE_BLOB_STORE_NAME
      - AZURE_BLOB_CONTAINER
    # HOST:CONTAINER mappings are quoted so they are always read as strings.
    ports:
      - '8008:8008'
    depends_on:
      - triton
    # Bind-mounts the local source directory over /app in the container.
    volumes:
      - ./fastapi_server:/app

  triton:
    build:
      context: ./triton_server
      # Shared-memory size available while the image is being built.
      shm_size: '16gb'
      args:
        - INDICPUNCT_COMMIT_HASH=${INDICPUNCT_COMMIT_HASH}
    restart: always
    # The log file path is inside the /logs/ mount declared under `volumes`.
    command: >-
      tritonserver
      --model-repository=/models/model_repository
      --log-file=/logs/log.txt
    environment:
      - TRITON_LOG_FILE
      - INDICPUNCT_COMMIT_HASH
    expose:
      - '8000'
      - '8001'
    ports:
      - '8000:8000'
      - '8001:8001'
      - '8002:8002'
    volumes:
      - ./triton_server/triton-model-repository/end2end/model_repository:/models/model_repository
      # NOTE(review): despite its name, TRITON_LOG_FILE is mounted at /logs/,
      # so it presumably has to be a host directory - confirm. If it is unset
      # the mount source is empty.
      - ${TRITON_LOG_FILE}:/logs/
    # Shared-memory size for the running container (separate from the
    # build-time setting above).
    shm_size: '16gb'
    ulimits:
      memlock: -1
      stack: 67108864
    # Reserves the NVIDIA GPU with device id '0' for this service.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              device_ids: ['0']
              capabilities: [gpu]