diff --git a/gpustack_runner/runner.py.json b/gpustack_runner/runner.py.json index 0dd17ca..ef0c853 100644 --- a/gpustack_runner/runner.py.json +++ b/gpustack_runner/runner.py.json @@ -824,6 +824,28 @@ "docker_image": "gpustack/runner:corex4.2-vllm0.8.3", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.9-sglang0.5.9", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.9-sglang0.5.9", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.9", @@ -1000,6 +1022,28 @@ "docker_image": "gpustack/runner:cuda12.9-vllm0.11.2", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.8-sglang0.5.9", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.8-sglang0.5.9", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.8", diff --git a/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json b/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json index a97958a..7ff1c44 100644 --- a/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json +++ b/tests/gpustack_runner/fixtures/test_list_runners_by_backend.json @@ -846,6 +846,28 @@ "backend": "cuda" }, [ + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.9-sglang0.5.9", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.9", + "original_backend_version": "12.9.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.9-sglang0.5.9", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.9", @@ -1022,6 +1044,28 @@ "docker_image": "gpustack/runner:cuda12.9-vllm0.11.2", "deprecated": false }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/amd64", + "docker_image": "gpustack/runner:cuda12.8-sglang0.5.9", + "deprecated": false + }, + { + "backend": "cuda", + "backend_version": "12.8", + "original_backend_version": "12.8.1", + "backend_variant": "", + "service": "sglang", + "service_version": "0.5.9", + "platform": "linux/arm64", + "docker_image": "gpustack/runner:cuda12.8-sglang0.5.9", + "deprecated": false + }, { "backend": "cuda", "backend_version": "12.8",