mirror of
https://github.com/1Panel-dev/1Panel.git
synced 2026-01-06 23:24:23 +08:00
32 lines
No EOL
730 B
YAML
32 lines
No EOL
730 B
YAML
services:
|
|
tensorrt-llm:
|
|
image: nvcr.io/nvidia/tensorrt-llm/release:${VERSION}
|
|
container_name: ${CONTAINER_NAME}
|
|
restart: always
|
|
runtime: nvidia
|
|
deploy:
|
|
resources:
|
|
reservations:
|
|
devices:
|
|
- driver: nvidia
|
|
count: all
|
|
capabilities: [gpu]
|
|
networks:
|
|
- 1panel-network
|
|
volumes:
|
|
- ${MODEL_PATH}:/models
|
|
ports:
|
|
- ${PANEL_APP_PORT_HTTP}:8000
|
|
ipc: host
|
|
ulimits:
|
|
memlock:
|
|
soft: -1
|
|
hard: -1
|
|
nofile:
|
|
soft: 65535
|
|
hard: 65535
|
|
stack: 67108864
|
|
command: bach -c "trtllm-serve /models/${MODEL_NAME} --host 0.0.0.0 --port 8000"
|
|
networks:
|
|
1panel-network:
|
|
external: true |