@@ -9,6 +9,7 @@ LLAMA_UPSTREAM_IMAGE ?= $(shell \
99 "$(LLAMA_SERVER_VERSION ) " "$(LLAMA_SERVER_VARIANT ) ")
# Docker image tags. DOCKER_IMAGE is the base model-runner image; the suffixed
# variables name the backend-specific images (vLLM CUDA, vLLM ROCm, SGLang, MUSA, OpenVINO).
1010DOCKER_IMAGE := docker/model-runner:latest
1111DOCKER_IMAGE_VLLM := docker/model-runner:latest-vllm-cuda
12+ DOCKER_IMAGE_VLLM_ROCM := docker/model-runner:latest-vllm-rocm
1213DOCKER_IMAGE_SGLANG := docker/model-runner:latest-sglang
1314DOCKER_IMAGE_MUSA := docker/model-runner:latest-musa
1415DOCKER_IMAGE_OPENVINO := docker/model-runner:latest-openvino
@@ -43,7 +44,7 @@ DOCKER_BUILD_COMMON_ARGS = \
# Declare command-style targets as phony so a file with the same name can never
# make them appear up to date. Each target name must be a single unbroken word.
4344.PHONY : build build-cli build-dmr build-llamacpp install-cli run clean test integration-tests e2e
4445.PHONY : validate validate-versions validate-all lint help
4546.PHONY : docker-build docker-build-multiplatform docker-run docker-run-impl
46- .PHONY : docker-build-vllm docker-run-vllm docker-build-sglang docker-run-sglang
47+ .PHONY : docker-build-vllm docker-run-vllm docker-build-vllm-rocm docker-run-vllm-rocm docker-build-sglang docker-run-sglang
4748.PHONY : docker-build-musa docker-run-musa docker-build-openvino docker-run-openvino
4849.PHONY : test-docker-ce-installation
4950.PHONY : vllm-metal-build vllm-metal-install vllm-metal-dev vllm-metal-clean
@@ -194,6 +195,23 @@ docker-build-vllm:
# Run the vLLM (CUDA) image: the docker-build-vllm prerequisite builds it first,
# then a silent sub-make runs docker-run-impl with DOCKER_IMAGE overridden to the vLLM tag.
194195docker-run-vllm : docker-build-vllm
195196 @$(MAKE ) -s docker-run-impl DOCKER_IMAGE=$(DOCKER_IMAGE_VLLM )
196197
198+ # Build the vLLM Docker image with ROCm (AMD GPU) support.
199+ # Builds upstream vLLM from source on top of rocm/vllm-dev:base — this is a
200+ # vLLM-only image (no llama.cpp), unlike the CUDA variant. The build is heavy:
201+ # expect 30-60 min and a final image size of ~12-15 GB.
202+ # LLAMA_SERVER_VARIANT is not consumed by the Dockerfile stages here, but
203+ # setting it to "rocm" restricts DOCKER_BUILD_PLATFORMS to linux/amd64
204+ # (vLLM ROCm has no aarch64 support). Delegates to the docker-build target through a sub-make, overriding DOCKER_TARGET and DOCKER_IMAGE.
205+ docker-build-vllm-rocm :
206+ @$(MAKE ) docker-build \
207+ DOCKER_TARGET=final-vllm-rocm \
208+ DOCKER_IMAGE=$(DOCKER_IMAGE_VLLM_ROCM ) \
209+ LLAMA_SERVER_VARIANT=rocm
210+
211+ # Run the vLLM ROCm Docker container with TCP port access and mounted model storage. The docker-build-vllm-rocm prerequisite builds the image first; a silent sub-make then runs docker-run-impl with DOCKER_IMAGE set to the ROCm tag.
212+ docker-run-vllm-rocm : docker-build-vllm-rocm
213+ @$(MAKE ) -s docker-run-impl DOCKER_IMAGE=$(DOCKER_IMAGE_VLLM_ROCM )
214+
197215# Build SGLang Docker image
198216docker-build-sglang :
199217 @$(MAKE ) docker-build \
@@ -402,8 +420,10 @@ help:
402420 @echo " docker-build - Build Docker image for current platform"
403421 @echo " docker-build-multiplatform - Build Docker image for multiple platforms"
404422 @echo " docker-run - Run in Docker container with TCP port access and mounted model storage"
405- @echo " docker-build-vllm - Build vLLM Docker image"
406- @echo " docker-run-vllm - Run vLLM Docker container"
423+ @echo " docker-build-vllm - Build vLLM Docker image (CUDA)"
424+ @echo " docker-run-vllm - Run vLLM Docker container (CUDA)"
425+ @echo " docker-build-vllm-rocm - Build vLLM Docker image (ROCm / AMD GPU, source build)"
426+ @echo " docker-run-vllm-rocm - Run vLLM Docker container (ROCm / AMD GPU)"
407427 @echo " docker-build-sglang - Build SGLang Docker image"
408428 @echo " docker-run-sglang - Run SGLang Docker container"
409429 @echo " docker-build-musa - Build MUSA Docker image"
0 commit comments