diff --git a/gpustack_runner/runner.py.json b/gpustack_runner/runner.py.json index f62a61f..9ba9f12 100644 --- a/gpustack_runner/runner.py.json +++ b/gpustack_runner/runner.py.json @@ -846,6 +846,28 @@ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.9", @@ -1011,6 +1033,28 @@ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.8", @@ -1209,6 +1253,28 @@ "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20", "deprecated": true }, + { + "backend": "cuda", + "backend_version": "12.6", + "original_backend_version": "12.6.3", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.6", + "original_backend_version": "12.6.3", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.6", diff --git a/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json b/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json index f56a53e..509c831 100644 --- a/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json +++ b/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json @@ -868,6 +868,28 @@ "docker_image": "gpustack/runner:cuda12.9-sglang0.5.6.post2", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.9-vllm0.14.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.9", @@ -1033,6 +1055,28 @@ "docker_image": "gpustack/runner:cuda12.8-sglang0.5.4.post3", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.8-vllm0.14.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.8", @@ -1231,6 +1275,28 @@ "docker_image": "gpustack/runner:cuda12.8-voxbox0.0.20", "deprecated": true }, + { + "backend": "cuda", + "backend_version": "12.6", + "original_backend_version": "12.6.3", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.6", + "original_backend_version": "12.6.3", + "backend_variant": "", + "service": "vllm", + "service_version": "0.14.1", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.6-vllm0.14.1", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.6",