From 38136c5f35d99fb6086b736f053935bb5d5adc23 Mon Sep 17 00:00:00 2001
From: Ruifeng Zheng
Date: Fri, 6 Feb 2026 20:35:24 +0800
Subject: [PATCH 1/3] test

---
Review notes (text in this section is not part of the commit message):

What this patch does to dev/spark-test-image/python-312/Dockerfile:
  * drops python3-pip and python3-venv from the apt-get install list;
  * creates the virtual environment with `--without-pip`;
  * installs pip by running get-pip.py from bootstrap.pypa.io;
  * moves the BASIC_PIP_PKGS / CONNECT_PIP_PKGS ARG declarations below the
    virtual-environment setup and drops the "Python deps for Spark Connect"
    comment.

Change made during review: the pip bootstrap no longer pipes curl into the
interpreter. The script is downloaded with `curl -f` (non-zero exit on HTTP
errors), executed from a file, and removed in the same RUN, so a failed
download fails this build step instead of depending on the exit status of
the right-hand side of a pipe. The change stays on a single added line, so
the hunk counts and the diffstat are unchanged.
NOTE(review): the post-image blob id on the "index" line was generated for
the original piped form of that line.

 dev/spark-test-image/python-312/Dockerfile | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/dev/spark-test-image/python-312/Dockerfile b/dev/spark-test-image/python-312/Dockerfile
index c88a17399fefc..7ab630f13f895 100644
--- a/dev/spark-test-image/python-312/Dockerfile
+++ b/dev/spark-test-image/python-312/Dockerfile
@@ -42,22 +42,22 @@ RUN apt-get update && apt-get install -y \
     libssl-dev \
     openjdk-17-jdk-headless \
     python3.12 \
-    python3-pip \
-    python3-venv \
     pkg-config \
     tzdata \
     software-properties-common \
     zlib1g-dev
 
-ARG BASIC_PIP_PKGS="numpy pyarrow>=22.0.0 six==1.16.0 pandas==2.3.3 scipy plotly<6.0.0 mlflow>=2.8.1 coverage matplotlib openpyxl memory-profiler>=0.61.0 scikit-learn>=1.3.2 pystack>=1.6.0 psutil"
-# Python deps for Spark Connect
-ARG CONNECT_PIP_PKGS="grpcio==1.76.0 grpcio-status==1.76.0 protobuf==6.33.5 googleapis-common-protos==1.71.0 zstandard==0.25.0 graphviz==0.20.3"
-
-# Install Python 3.12 packages
+# Setup virtual environment
 ENV VIRTUAL_ENV /opt/spark-venv
-RUN python3.12 -m venv $VIRTUAL_ENV
+RUN python3.12 -m venv --without-pip $VIRTUAL_ENV
 ENV PATH="$VIRTUAL_ENV/bin:$PATH"
 
+# Install Python 3.12 packages
+RUN curl -fsSL https://bootstrap.pypa.io/get-pip.py -o /tmp/get-pip.py && python3.12 /tmp/get-pip.py && rm -f /tmp/get-pip.py
+
+ARG BASIC_PIP_PKGS="numpy pyarrow>=22.0.0 six==1.16.0 pandas==2.3.3 scipy plotly<6.0.0 mlflow>=2.8.1 coverage matplotlib openpyxl memory-profiler>=0.61.0 scikit-learn>=1.3.2 pystack>=1.6.0 psutil"
+ARG CONNECT_PIP_PKGS="grpcio==1.76.0 grpcio-status==1.76.0 protobuf==6.33.5 googleapis-common-protos==1.71.0 zstandard==0.25.0 graphviz==0.20.3"
+
 RUN python3.12 -m pip install $BASIC_PIP_PKGS unittest-xml-reporting $CONNECT_PIP_PKGS lxml && \
     python3.12 -m pip install torch torchvision --index-url https://download.pytorch.org/whl/cpu && \
     python3.12 -m pip install torcheval && \
From a47ac35380a078d2cabc2db9dc66d77aabfdbb38 Mon Sep 17 00:00:00 2001
From: Ruifeng Zheng
Date: Fri, 6 Feb 2026 20:35:41 +0800
Subject: [PATCH 2/3] test

---
Review notes (text in this section is not part of the commit message):
Rewrites `ENV VIRTUAL_ENV /opt/spark-venv` in the key=value form
(`ENV VIRTUAL_ENV=/opt/spark-venv`). No other line is touched.

 dev/spark-test-image/python-312/Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dev/spark-test-image/python-312/Dockerfile b/dev/spark-test-image/python-312/Dockerfile
index 7ab630f13f895..6a7ecbba988bc 100644
--- a/dev/spark-test-image/python-312/Dockerfile
+++ b/dev/spark-test-image/python-312/Dockerfile
@@ -48,7 +48,7 @@ RUN apt-get update && apt-get install -y \
     zlib1g-dev
 
 # Setup virtual environment
-ENV VIRTUAL_ENV /opt/spark-venv
+ENV VIRTUAL_ENV=/opt/spark-venv
 RUN python3.12 -m venv --without-pip $VIRTUAL_ENV
 ENV PATH="$VIRTUAL_ENV/bin:$PATH"
 
From eb23b229099e52db550357502237f93bff5176c3 Mon Sep 17 00:00:00 2001
From: Ruifeng Zheng
Date: Sat, 7 Feb 2026 17:40:15 +0800
Subject: [PATCH 3/3] clean up

---
Review notes (text in this section is not part of the commit message):
Extends the apt-get install RUN so that, in the same instruction, it also
runs `apt-get autoremove --purge -y`, `apt-get clean`, and removes
/var/lib/apt/lists/*.

 dev/spark-test-image/python-312/Dockerfile | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/dev/spark-test-image/python-312/Dockerfile b/dev/spark-test-image/python-312/Dockerfile
index 6a7ecbba988bc..fd789bd298eed 100644
--- a/dev/spark-test-image/python-312/Dockerfile
+++ b/dev/spark-test-image/python-312/Dockerfile
@@ -45,7 +45,10 @@ RUN apt-get update && apt-get install -y \
     pkg-config \
     tzdata \
     software-properties-common \
-    zlib1g-dev
+    zlib1g-dev \
+    && apt-get autoremove --purge -y \
+    && apt-get clean \
+    && rm -rf /var/lib/apt/lists/*
 
 # Setup virtual environment
 ENV VIRTUAL_ENV=/opt/spark-venv