# torchserve-cuda.yml
---
# Docker Compose stack that runs a single TorchServe container from the
# iqtlabs/cuda-torchserve image with one NVIDIA GPU reserved for it.

networks:
  # Dedicated bridge network for this stack; the bridge MTU is set to 9000.
  gamutrf:
    driver: bridge
    driver_opts:
      com.docker.network.driver.mtu: 9000
  # Map the implicit `default` network onto the pre-existing network named
  # `none`. `external: true` means Compose does not create it.
  default:
    external: true
    name: none

services:
  torchserve:
    restart: always
    image: iqtlabs/cuda-torchserve:v0.0.9
    healthcheck:
      # Only the start-up grace period is set here; no `test` command is
      # defined in this file (presumably the image provides one -- confirm).
      start_period: 120s
    networks:
      - gamutrf
    ports:
      # host:container, quoted so YAML never reinterprets the value.
      # NOTE(review): presumably TorchServe's inference (8080) and
      # management (8081) endpoints -- confirm against the image's config.
      - '8080:8080'
      - '8081:8081'
    volumes:
      # VOL_PREFIX is substituted by Compose from the environment / .env file.
      - '${VOL_PREFIX}/model_store:/model_store'
      # Bind-mount the host's pip cache directory at the same path in the
      # container.
      - '/root/.cache/pip:/root/.cache/pip'
    deploy:
      resources:
        reservations:
          # Reserve one NVIDIA device with the `gpu` capability.
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]
    command:
      # can be multiple models
      # e.g. mini2_snr=mini2_snr.mar,another_mini2_snr=another_mini2_snr.mar
      # As of torchserve v11, you will need to add setuptools==69.5.1
      # to your requirements.txt when generating a MAR file
      # https://github.com/pytorch/serve/issues/3176
      #
      # NOTE(review): `--models` and its value are one list element, so they
      # are handed to the container as a single argument; presumably the
      # image's entrypoint re-splits it -- confirm before restructuring.
      - '--disable-token-auth'
      - '--models torchsig_model=torchsig_model.mar'