diff --git a/gpustack_runner/runner.py.json b/gpustack_runner/runner.py.json index d895971..8bfaccf 100644 --- a/gpustack_runner/runner.py.json +++ b/gpustack_runner/runner.py.json @@ -978,6 +978,28 @@ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.17.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.17.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.9", @@ -1253,6 +1275,28 @@ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3", "deprecated": true }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.17.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.17.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.8", diff --git a/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json b/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json index b9b5ab0..fc6c1e4 100644 --- a/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json +++ b/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json @@ -1000,6 +1000,28 @@ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.17.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.17.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.9", @@ -1275,6 +1297,28 @@ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3", "deprecated": true }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.17.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.17.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.17.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.8",