Skip to content

Commit 899c703

Browse files
Internal change
PiperOrigin-RevId: 922850859
1 parent 76b61ae commit 899c703

4 files changed

Lines changed: 235 additions & 5 deletions

File tree

.bazelrc

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,3 +32,7 @@ build:windows --google_default_credentials=true
3232
build:macos --remote_cache=https://storage.googleapis.com/macos-cel-python-remote-cache
3333
build:macos --google_default_credentials=true
3434

35+
# Silence deprecation warnings from external dependencies (Linux and macOS)
# NOTE(review): --cxxopt is applied to every C++ compilation in the target
# configuration, so -Wno-deprecated-declarations also hides these warnings for
# first-party code, not only for external dependencies.
36+
build:linux --cxxopt=-Wno-deprecated-declarations
37+
build:macos --cxxopt=-Wno-deprecated-declarations
38+

release/kokoro/release_linux.cfg

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,3 +3,8 @@
33

44
build_file: "cel-python/release/kokoro/release_linux.sh"
55
timeout_mins: 120
6+
7+
container_properties {
8+
docker_image: "us-central1-docker.pkg.dev/kokoro-container-bakery/kokoro/ubuntu/ubuntu2204/ktcb:current"
9+
docker_sibling_containers: true
10+
}

release/kokoro/release_linux.sh

Lines changed: 215 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,14 +1,123 @@
11
#!/bin/bash
22
set -e
33

4+
5+
# Avoid virtualenv/pip trying to download/upgrade tools from PyPI on host
6+
export VIRTUALENV_NO_DOWNLOAD=1
7+
export PIP_DISABLE_PIP_VERSION_CHECK=1
8+
9+
# Pass these environment variables to the cibuildwheel Docker container
10+
export CIBW_ENVIRONMENT="VIRTUALENV_NO_DOWNLOAD=1 PIP_DISABLE_PIP_VERSION_CHECK=1"
11+
export CIBW_DEPENDENCY_VERSIONS="latest"
12+
413
# If running locally (not on Kokoro), authenticate with gcloud.
514
if [ -z "${KOKORO_BUILD_ID}" ]; then
615
if ! gcloud auth application-default print-access-token --quiet > /dev/null; then
716
gcloud auth application-default login
817
fi
918
fi
1019

11-
pip install -U keyring keyrings.google-artifactregistry-auth twine cibuildwheel
20+
# We use --no-cache-dir to force pip to download packages fresh and bypass the local
21+
# cache. In Kokoro/RBE sandboxed environments, writing to the default cache directory
22+
# (~/.cache/pip) can encounter permission/sandbox restrictions or lead to stale
23+
# dependency resolution. Disabling the cache ensures a reliable, reproducible install.
24+
pip install --no-cache-dir -U keyring keyrings.google-artifactregistry-auth twine cibuildwheel
25+
26+
# Patch cibuildwheel at runtime to bypass the RBE stdout buffering deadlock.
27+
# The RBE proxy buffers the persistent container bash stdout. By appending a 4KB
28+
# padding line to the end of every command output, we force the proxy to flush the
29+
# buffer immediately. We then read and discard this padding to keep the stream clean.
# NOTE(review): the patch script matches exact source text inside
# cibuildwheel/oci_container.py, while cibuildwheel itself is installed unpinned
# (`pip install -U`) earlier in this script. An upstream change to that file can
# make the match targets stop applying; consider pinning the cibuildwheel version.
30+
# Resolve the on-disk path of the installed cibuildwheel.oci_container module.
OCI_PATH=$(python3 -c "import cibuildwheel.oci_container; print(cibuildwheel.oci_container.__file__)")
31+
echo "Patching cibuildwheel at $OCI_PATH..."
32+
33+
cat << 'EOF' > patch_oci.py
34+
import sys
35+
import os
36+
37+
path = sys.argv[1]
38+
with open(path, 'r') as f:
39+
content = f.read()
40+
41+
# 1. Force a 4KB flush at the end of every command execution
42+
target_write = 'printf "%04d%s\\n" $? {end_of_message}'
43+
replacement_write = 'printf "%04d%s\\n%4096s\\n" $? {end_of_message} " "'
44+
if target_write in content:
    content = content.replace(target_write, replacement_write)
    print("Patched write loop.")
else:
    # Fail fast instead of silently skipping. The writer-side padding and the
    # reader-side discard form one protocol change: if this half is missing
    # while the read loop is patched, the reader blocks on a padding line that
    # is never sent.
    print("Error: target_write not found!")
    sys.exit(1)
47+
48+
# 2. Read and discard the 4KB padding to keep the stream clean
49+
target_read = """ # add the last line to output, without the footer
50+
output_io.write(line[0:footer_offset])
51+
output_io.flush()
52+
break"""
53+
54+
replacement_read = """ # add the last line to output, without the footer
55+
output_io.write(line[0:footer_offset])
56+
output_io.flush()
57+
# Read and discard the 4KB padding line to clear the stream!
58+
self.bash_stdout.readline()
59+
break"""
60+
61+
if target_read in content:
    content = content.replace(target_read, replacement_read)
    print("Patched read loop.")
else:
    # Fail fast instead of silently skipping. If the write loop emits the
    # padding line but the read loop does not discard it, the padding is
    # consumed as the first output line of the next command and corrupts the
    # stream.
    print("Error: target_read not found!")
    sys.exit(1)
64+
65+
# 3. Replace the deadlock-prone cat-based copy_into with native docker cp
66+
target_copy = """ else:
67+
exec_process: subprocess.Popen[bytes]
68+
self.call(["mkdir", "-p", to_path.parent])
69+
with subprocess.Popen(
70+
[
71+
self.engine.name,
72+
"exec",
73+
"-i",
74+
str(self.name),
75+
"sh",
76+
"-c",
77+
f"cat > {shell_quote(to_path)}",
78+
],
79+
stdin=subprocess.PIPE,
80+
) as exec_process:
81+
assert exec_process.stdin
82+
with open(from_path, "rb") as from_file:
83+
shutil.copyfileobj(from_file, exec_process.stdin)
84+
85+
exec_process.stdin.close()
86+
exec_process.wait()
87+
88+
if exec_process.returncode:
89+
raise subprocess.CalledProcessError(
90+
exec_process.returncode, exec_process.args, None, None
91+
)"""
92+
93+
replacement_copy = """ else:
94+
self.call(["mkdir", "-p", to_path.parent])
95+
# Use native docker cp to copy the file, avoiding stdin EOF deadlocks in RBE
96+
subprocess.run(
97+
[
98+
self.engine.name,
99+
"cp",
100+
str(from_path),
101+
f"{self.name}:{to_path}",
102+
],
103+
check=True,
104+
)"""
105+
106+
if target_copy in content:
107+
content = content.replace(target_copy, replacement_copy)
108+
print("Patched copy_into to use docker cp.")
109+
else:
110+
print("Error: target_copy not found!")
111+
sys.exit(1)
112+
113+
with open(path, 'w') as f:
114+
f.write(content)
115+
116+
print("Successfully patched oci_container.py!")
117+
EOF
118+
119+
python3 patch_oci.py "$OCI_PATH"
120+
rm patch_oci.py
12121

13122
REPO_DIR=$(mktemp -d)
14123
echo "Created temporary directory: ${REPO_DIR}"
@@ -52,17 +161,121 @@ cp -r "${SRC_DIR}"/{*,.*} . 2>/dev/null || true
52161
cp -r "${SRC_DIR}"/release/* . 2>/dev/null || true
53162
rm -rf cel_expr_python/*_test.py
54163

164+
echo "Downloading bazelisk on host..."
# -f makes curl exit non-zero on an HTTP error instead of saving the server's
# error page under the binary's name (which would then be chmod'ed and copied
# into the container as "bazel"). --retry rides out transient network failures.
curl -fLO --retry 3 https://github.com/bazelbuild/bazelisk/releases/download/v1.19.0/bazelisk-linux-amd64
chmod +x bazelisk-linux-amd64
167+
55168
# Check if pyproject.toml exists before running sed
56169
if [ -f pyproject.toml ]; then
57170
sed -i "" "s/\$VERSION/${VERSION}/g" pyproject.toml || sed -i "s/\$VERSION/${VERSION}/g" pyproject.toml
58171
fi
59172

173+
# Presumably meant to start the cibuildwheel build container on the host network.
# NOTE(review): cibuildwheel documents extra container arguments through the
# `create_args` field of CIBW_CONTAINER_ENGINE / `container-engine`. Confirm that
# CIBW_CONTAINER_ENGINE_EXTRA_ARGS is actually read; otherwise this export has no effect.
export CIBW_CONTAINER_ENGINE_EXTRA_ARGS="--network=host"
174+
60175
# Default CIBWHEEL_BIN if not set. The default must be applied before the value
# is echoed; otherwise the message shows an empty command whenever the default
# is the one actually used.
if [ -z "${CIBWHEEL_BIN}" ]; then
  CIBWHEEL_BIN="python3 -m cibuildwheel"
fi
echo "Running cibuildwheel: ${CIBWHEEL_BIN}"
65-
${CIBWHEEL_BIN} --platform linux --output-dir dist
180+
181+
echo "Installing diagnostic tools (psmisc, strace) on host..."
182+
# We try to install them, but don't fail the build if we can't (e.g. if no sudo or apt)
183+
sudo apt-get update && sudo apt-get install -y psmisc strace || echo "Failed to install diagnostic tools, proceeding anyway..."
184+
185+
echo "Running cibuildwheel in background..."
186+
${CIBWHEEL_BIN} --platform linux --output-dir dist > cibuildwheel.log 2>&1 &
187+
CIBW_PID=$!
188+
189+
echo "Started cibuildwheel in background with PID $CIBW_PID"
190+
191+
# Poll the log file waiting for the hang
# The loop below checks every 10 seconds while the background cibuildwheel
# process (CIBW_PID) is alive, and stops when the process exits, a hang is
# flagged, or TIMEOUT seconds of polling have elapsed.
192+
# We look for the "mkdir -p" line followed by no activity for 60 seconds.
193+
TIMEOUT=900 # 15 minutes of polling; see the note at the timeout check below
194+
ELAPSED=0
195+
LAST_SIZE=0
196+
STUCK_COUNT=0
197+
HANG_DETECTED=false
198+
199+
# `kill -0` sends no signal; it only tests whether the process still exists.
while kill -0 $CIBW_PID 2>/dev/null; do
200+
if [ -f cibuildwheel.log ]; then
201+
# Check if the log contains the test setup line
# NOTE(review): grep scans the whole log, so once "mkdir -p" has appeared
# anywhere, any later 60-second stretch without log growth is reported as a
# hang "at mkdir -p". Confirm whether only the tail of the log should match.
202+
if grep -q "mkdir -p" cibuildwheel.log; then
203+
# Log size in bytes (`stat -c` is the GNU coreutils form).
CURRENT_SIZE=$(stat -c%s cibuildwheel.log)
204+
if [ "$CURRENT_SIZE" -eq "$LAST_SIZE" ]; then
205+
# Log size hasn't changed. If this persists for 60 seconds, we assume it is stuck.
# The increment of 10 mirrors the `sleep 10` polling interval below.
206+
STUCK_COUNT=$((STUCK_COUNT + 10))
207+
echo "Log size unchanged for ${STUCK_COUNT}s at mkdir -p..."
208+
if [ $STUCK_COUNT -ge 60 ]; then
209+
HANG_DETECTED=true
210+
break
211+
fi
212+
else
213+
# The log grew: reset the stall counter and remember the new size.
STUCK_COUNT=0
214+
LAST_SIZE=$CURRENT_SIZE
215+
fi
216+
fi
217+
fi
218+
219+
sleep 10
220+
ELAPSED=$((ELAPSED + 10))
221+
# NOTE(review): this break only ends the polling; it does not stop cibuildwheel.
# The `wait $CIBW_PID` after the hang-diagnostics block still blocks until the
# process exits on its own, so TIMEOUT does not bound the total build time.
if [ $ELAPSED -ge $TIMEOUT ]; then
222+
echo "Timeout waiting for build to complete."
223+
break
224+
fi
225+
done
226+
227+
if [ "$HANG_DETECTED" = "true" ]; then
  # Hang path: dump host and container state for post-mortem analysis, then
  # kill the background cibuildwheel process and fail the job with exit code 99.
  #
  # The script runs under `set -e`, so every probe that can fail carries a
  # fallback. Without one, a single failing diagnostic (for example `ps` missing
  # inside the container) would abort the script before the log tail is printed
  # and before cibuildwheel is killed.
  echo "===================================================="
  echo "!!! DETECTED HANG AT mkdir -p !!! STARTING DIAGNOSTICS"
  echo "===================================================="

  echo "=== HOST PROCESSES ==="
  ps aux || echo "ps failed"

  echo "=== PROCESS TREE ==="
  pstree -p -a || echo "pstree not available"

  echo "=== DOCKER CONTAINERS ==="
  docker ps -a || echo "docker ps failed"

  # Inspect the first running container that docker reports.
  CONTAINER_ID=$(docker ps -q | head -n 1)
  if [ -n "$CONTAINER_ID" ]; then
    echo "=== CONTAINER PROCESSES ($CONTAINER_ID) ==="
    docker exec "$CONTAINER_ID" ps aux || echo "ps not available in container"

    echo "=== CONTAINER LSOF ==="
    docker exec "$CONTAINER_ID" lsof || echo "lsof not available"

    echo "=== CONTAINER DOCKER INSPECT ==="
    docker inspect "$CONTAINER_ID" || echo "docker inspect failed"

    echo "=== STRACE DOCKER PROCESSES ==="
    # First host process whose command line matches "docker start" or "docker exec".
    DOCKER_PID=$(pgrep -f "docker start|docker exec" | head -n 1)
    if [ -n "$DOCKER_PID" ]; then
      echo "Stracing host docker process $DOCKER_PID for 15 seconds..."
      timeout 15 strace -p "$DOCKER_PID" -f || true
    fi
  else
    echo "No active docker container found!"
  fi

  echo "=== LAST 100 LINES OF CIBUILDWHEEL LOG ==="
  tail -n 100 cibuildwheel.log || echo "cibuildwheel.log not readable"

  echo "Diagnostics complete. Killing cibuildwheel."
  # The process may already have exited; that must not replace exit code 99.
  kill -9 "$CIBW_PID" 2>/dev/null || true
  exit 99
fi
269+
270+
# If it didn't hang, wait for it to finish and print the log.
# The script runs under `set -e`, so a bare `wait` that returns non-zero would
# terminate the script right there, before the log is printed. All cibuildwheel
# output was redirected into that log, so the failure would be invisible.
# Collecting the status through `||` keeps errexit from firing.
RC=0
wait "$CIBW_PID" || RC=$?
echo "=== CIBUILDWHEEL LOG ==="
cat cibuildwheel.log
if [ "$RC" -ne 0 ]; then
  echo "cibuildwheel failed with exit code $RC"
  exit "$RC"
fi
66279

67280
if [ "${DRY_RUN}" = "true" ]; then
68281
echo "[DRY RUN] Skipping upload to PyPI exit gate."

release/pyproject.toml

Lines changed: 11 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -38,13 +38,21 @@ where = ["."]
3838
exclude = ["codelab*", "conformance*", "custom_ext*", "release*", "testing*", "wheelhouse*"]
3939

4040
[tool.cibuildwheel]
41-
build = "cp311-* cp312-* cp313-* cp314-*"
42-
skip = "*musllinux* *win32*"
41+
# NOTE(review): only CPython 3.11 wheels are built. The wider matrix is kept
# commented out below, presumably as a temporary restriction while the Linux
# build is being debugged; confirm and restore it before the next release.
build = "cp311-*"
42+
#build = "cp311-* cp312-* cp313-* cp314-*"
43+
# Skip musllinux, 32-bit Windows (win32) and 32-bit x86 (i686) builds.
skip = "*musllinux* *win32* *i686*"
4344
test-command = "python {project}/cel_basic_test.py"
4445
build-verbosity = 1
4546

4647
[tool.cibuildwheel.linux]
47-
before-all = "echo 'Installing bazelisk'; curl -LO https://github.com/bazelbuild/bazelisk/releases/download/v1.19.0/bazelisk-linux-amd64 && chmod +x bazelisk-linux-amd64 && mv bazelisk-linux-amd64 /usr/local/bin/bazel"
48+
manylinux-x86_64-image = "manylinux_2_28"
49+
container-engine = "docker; disable_host_mount: True"
50+
# Google's internal Kokoro/RBE network uses a secure MITM proxy that resigns HTTPS
51+
# traffic with an internal Google CA. Since the public manylinux container does not
52+
# trust this CA, git fetches for external dependencies (like @cel-cpp) will fail
53+
# with SSL certificate errors. We disable http.sslVerify inside the container to
54+
# bypass this and allow Bazel to fetch SCM dependencies through the proxy.
# SECURITY NOTE(review): http.sslVerify=false turns off TLS certificate
# verification for every git operation in the build container, so fetched
# sources are not authenticated. If the proxy's CA certificate can be made
# available in the container, pointing git at it (http.sslCAInfo) would avoid
# disabling verification; confirm feasibility.
# The bazelisk binary is copied from the project directory instead of being
# downloaded inside the container; release_linux.sh fetches it on the host.
55+
before-all = "git config --global http.sslVerify false && echo 'Installing bazelisk' && cp {project}/bazelisk-linux-amd64 /usr/local/bin/bazel"
4856

4957
[tool.cibuildwheel.macos]
5058
before-all = "echo 'Installing bazelisk'; brew install bazelisk"

0 commit comments

Comments
 (0)