diff --git a/model-engine/model_engine_server/inference/vllm/Dockerfile.vllm b/model-engine/model_engine_server/inference/vllm/Dockerfile.vllm
index ebb1b3fb..58497cc8 100644
--- a/model-engine/model_engine_server/inference/vllm/Dockerfile.vllm
+++ b/model-engine/model_engine_server/inference/vllm/Dockerfile.vllm
@@ -12,6 +12,9 @@ RUN apt-get update \
 
 WORKDIR /workspace
 
+ARG VLLM_VERSION
+RUN pip install --no-cache-dir "vllm[audio]==${VLLM_VERSION}"
+
 RUN wget https://github.com/peak/s5cmd/releases/download/v2.2.1/s5cmd_2.2.1_Linux-64bit.tar.gz
 RUN tar -xvzf s5cmd_2.2.1_Linux-64bit.tar.gz
 