cipherstash · tobyhede · Apr 8, 2026 · Apr 8, 2026 · Apr 9, 2026 · Apr 9, 2026
diff --git a/.github/workflows/benchmark.yml b/.github/workflows/benchmark.yml
@@ -0,0 +1,86 @@
+name: "Scheduled Benchmarks (Tier 2)"
+
+on:
+  schedule:
+    - cron: '0 3 * * 1'   # Every Monday 03:00 UTC
+  workflow_dispatch:
+
+# Least privilege: this job only needs to read the repository contents.
+permissions:
+  contents: read
+
+# Prevent a scheduled run from racing a manual dispatch for the same ports.
+concurrency:
+  group: scheduled-benchmarks
+  cancel-in-progress: false
+
+env:
+  # Matches test-eql.yml — forces JS-based composite actions onto Node 24.
+  FORCE_JAVASCRIPT_ACTIONS_TO_NODE24: "true"
+
+jobs:
+  benchmark:
+    name: "100K dataset benchmark (Postgres 17)"
+    runs-on: ubuntu-latest
+    timeout-minutes: 60
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install postgresql-client
+        # generate.sh uses psql directly against Postgres (port 7433) and Proxy
+        # (port 6433). jdx/mise-action only installs Rust + Python.
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y postgresql-client
+
+      - uses: jdx/mise-action@v3
+        with:
+          version: 2026.4.0
+          install: true
+          cache: true
+
+      - name: Write Proxy credentials to .env
+        # Secrets are passed through the step environment and written with
+        # printf, so their values are never interpolated into the script text.
+        env:
+          CS_CLIENT_ACCESS_KEY: ${{ secrets.CS_CLIENT_ACCESS_KEY }}
+          CS_DEFAULT_KEYSET_ID: ${{ secrets.CS_DEFAULT_KEYSET_ID }}
+          CS_CLIENT_KEY: ${{ secrets.CS_CLIENT_KEY }}
+          CS_CLIENT_ID: ${{ secrets.CS_CLIENT_ID }}
+          CS_WORKSPACE_CRN: ${{ secrets.CS_WORKSPACE_CRN }}
+        run: |
+          {
+            printf 'CS_CLIENT_ACCESS_KEY=%s\n' "$CS_CLIENT_ACCESS_KEY"
+            printf 'CS_DEFAULT_KEYSET_ID=%s\n' "$CS_DEFAULT_KEYSET_ID"
+            printf 'CS_CLIENT_KEY=%s\n' "$CS_CLIENT_KEY"
+            printf 'CS_CLIENT_ID=%s\n' "$CS_CLIENT_ID"
+            printf 'CS_WORKSPACE_CRN=%s\n' "$CS_WORKSPACE_CRN"
+          } > tests/benchmarks/.env
+
+      - name: Bring up Postgres + Proxy
+        run: mise run bench:up
+
+      - name: Generate 100K dataset
+        run: mise run bench:generate
+
+      - name: Run Tier 2 benchmark suite
+        # The run id suffix keeps BENCH_REPORT_DATE unique across same-day runs.
+        run: |
+          BENCH_REPORT_DATE="$(date -u +%Y-%m-%d)-${{ github.run_id }}"
+          export BENCH_REPORT_DATE
+          mise run bench:full
+
+      - name: Tear down containers
+        # Runs even when an earlier step failed.
+        if: always()
+        run: mise run bench:down
+
+      - name: Upload benchmark report
+        # Also runs on failure so anything written to reports/ is still uploaded.
+        if: always()
+        uses: actions/upload-artifact@v4
+        with:
+          name: benchmark-report-${{ github.run_id }}
+          path: tests/benchmarks/reports/
+          retention-days: 90
diff --git a/mise.toml b/mise.toml
@@ -14,7 +14,7 @@
 "python" = "3.13"
 
 [task_config]
-includes = ["tasks", "tasks/postgres.toml"]
+includes = ["tasks", "tasks/postgres.toml", "tasks/bench.toml"]
 
 [env]
 POSTGRES_DB = "cipherstash"

diff --git a/tasks/bench.toml b/tasks/bench.toml
@@ -0,0 +1,45 @@
+["bench:up"]
+description = "Start Postgres + Proxy for benchmark data generation"
+dir = "{{config_root}}"
+# Fails fast when the credentials file is missing; --wait blocks until the
+# compose services are running/healthy.
+run = """
+if [ ! -f tests/benchmarks/.env ]; then
+  echo "ERROR: tests/benchmarks/.env missing. Copy .env.example and fill in credentials." >&2
+  exit 1
+fi
+docker compose --env-file tests/benchmarks/.env -f tests/benchmarks/docker-compose.yml up -d --wait
+"""
+
+["bench:down"]
+description = "Stop benchmark Postgres + Proxy"
+dir = "{{config_root}}"
+# Reuse the env file from bench:up when present so compose can interpolate the
+# CS_* variables without "variable is not set" warnings. Teardown must still
+# work without it, so fall back to the plain invocation. -v also removes volumes.
+run = """
+if [ -f tests/benchmarks/.env ]; then
+  docker compose --env-file tests/benchmarks/.env -f tests/benchmarks/docker-compose.yml down -v
+else
+  docker compose -f tests/benchmarks/docker-compose.yml down -v
+fi
+"""
+
+["bench:generate"]
+description = "Generate 100K encrypted bench dataset (requires bench:up first)"
+# `build` produces release/cipherstash-encrypt.sql, which generate.sh
+# installs into the bench Postgres container before applying schema.sql.
+depends = ["build"]
+dir = "{{config_root}}"
+run = """
+tests/benchmarks/generate.sh 100k
+"""
+
+["bench:full"]
+description = "Run full Tier 2 benchmark suite against bench-postgres"
+dir = "{{config_root}}/tests/sqlx"
+# DATABASE_URL targets bench-postgres directly (host port 7433), not the Proxy.
+env = { DATABASE_URL = "postgresql://cipherstash:password@localhost:7433/cipherstash" }
+run = """
+cargo test --test bench_perf_tests run_all_benchmarks -- --ignored --nocapture
+"""
diff --git a/tests/benchmarks/.env.example b/tests/benchmarks/.env.example
@@ -0,0 +1,7 @@
+# CipherStash Proxy credentials
+# Get these from https://dashboard.cipherstash.com
+CS_CLIENT_ACCESS_KEY=
+CS_DEFAULT_KEYSET_ID=
+CS_CLIENT_KEY=
+CS_CLIENT_ID=
+CS_WORKSPACE_CRN=
diff --git a/tests/benchmarks/.gitignore b/tests/benchmarks/.gitignore
@@ -0,0 +1,6 @@
+# Generated reports (too large for git, regenerated on demand)
+reports/*
+!reports/.gitkeep
+
+# Local Proxy credentials
+.env
diff --git a/tests/benchmarks/README.md b/tests/benchmarks/README.md
@@ -0,0 +1,48 @@
+# EQL Scheduled Benchmarks (Tier 2)
+
+Heavy-weight performance benchmarks that run weekly in CI against 100K-row
+encrypted datasets. Complements the Tier 1 tests in `tests/sqlx/tests/bench_*`.
+
+## What this is
+
+- Brings up Postgres + CipherStash Proxy via docker-compose
+- Inserts 100K plaintext rows through the Proxy (which encrypts them)
+- Runs each P0/P1/P2 query pattern 10 times
+- Reads `pg_stat_statements` for statistical aggregates
+- Outputs JSON + Markdown reports
+
+## Local usage
+
+```bash
+# Populate credentials
+cp tests/benchmarks/.env.example tests/benchmarks/.env
+# Edit .env with your CipherStash credentials
+
+# Start Postgres + Proxy
+mise run bench:up
+
+# Build EQL and generate 100K dataset (bench:generate depends on build)
+mise run bench:generate
+
+# Run the full Tier 2 suite
+mise run bench:full
+
+# Results land in tests/benchmarks/reports/
+```
+
+## CI usage
+
+Runs automatically every Monday at 03:00 UTC via
+`.github/workflows/benchmark.yml`. Also manually invocable from the
+GitHub Actions UI (Run workflow button).
+
+## Why a separate workflow
+
+- 100K generation takes ~100 seconds via the Proxy
+- The slowest pattern (`bench_ore_order_by_limit`) takes several seconds per run on 100K rows
+- Regular PR CI must stay under 10 minutes; this suite would blow that budget
+
+## Output
+
+`tests/benchmarks/reports/benchmark-YYYY-MM-DD.{json,md}` — uploaded as a
+GitHub Actions artifact named `benchmark-report-<run-id>`.
diff --git a/tests/benchmarks/docker-compose.yml b/tests/benchmarks/docker-compose.yml
@@ -0,0 +1,67 @@
+services:
+  postgres:
+    image: postgres:17
+    container_name: bench-postgres
+    # pg_stat_statements only collects data when preloaded at server start.
+    command: >
+      postgres
+      -c track_functions=all
+      -c shared_preload_libraries=pg_stat_statements
+      -c pg_stat_statements.track=all
+      -c pg_stat_statements.max=10000
+    ports:
+      - "127.0.0.1:7433:5432"
+    environment:
+      POSTGRES_DB: cipherstash
+      POSTGRES_USER: cipherstash
+      POSTGRES_PASSWORD: password
+    healthcheck:
+      # Probe over TCP rather than the Unix socket. On first boot the postgres
+      # image runs a temporary socket-only server during initialisation, so a
+      # socket probe can report healthy before the final server accepts the
+      # TCP connections the Proxy depends on.
+      test: ["CMD-SHELL", "pg_isready -h 127.0.0.1 -U cipherstash -d cipherstash"]
+      interval: 1s
+      timeout: 5s
+      retries: 10
+    networks:
+      - bench
+
+  proxy:
+    # NOTE(review): `latest` is unpinned, so benchmark numbers can shift when a
+    # new Proxy image is published — consider pinning a version tag.
+    image: cipherstash/proxy:latest
+    container_name: bench-proxy
+    ports:
+      - "127.0.0.1:6433:6432"
+    environment:
+      CS_DATABASE__NAME: cipherstash
+      CS_DATABASE__USERNAME: cipherstash
+      CS_DATABASE__PASSWORD: password
+      CS_DATABASE__HOST: postgres
+      # Quoted so the value is an explicit string like the other env entries.
+      CS_DATABASE__PORT: "5432"
+      # EQL install is performed explicitly by generate.sh before schema.sql runs.
+      # Leaving Proxy's own install off avoids racing against generate.sh.
+      CS_DATABASE__INSTALL_EQL: "false"
+      CS_CLIENT_ACCESS_KEY: ${CS_CLIENT_ACCESS_KEY}
+      CS_DEFAULT_KEYSET_ID: ${CS_DEFAULT_KEYSET_ID}
+      CS_CLIENT_KEY: ${CS_CLIENT_KEY}
+      CS_CLIENT_ID: ${CS_CLIENT_ID}
+      CS_WORKSPACE_CRN: ${CS_WORKSPACE_CRN}
+    healthcheck:
+      # Probe the Proxy's pg-protocol listener (no auth handshake required).
+      # busybox `nc` is present in the cipherstash/proxy image.
+      test: ["CMD-SHELL", "nc -z localhost 6432"]
+      interval: 1s
+      timeout: 5s
+      retries: 30
+    depends_on:
+      postgres:
+        condition: service_healthy
+    networks:
+      - bench
+
+networks:
+  bench:
+    driver: bridge
diff --git a/tests/benchmarks/generate.sh b/tests/benchmarks/generate.sh
@@ -0,0 +1,74 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+# Builds the 100K-row encrypted bench dataset by inserting through CipherStash Proxy.
+# v1 writes no dump — the Tier 2 workflow regenerates the data on every run.
+#
+# Before running:
+#   - mise run build  (produces release/cipherstash-encrypt.sql)
+#   - docker compose -f tests/benchmarks/docker-compose.yml up -d --wait
+#   - tests/benchmarks/.env populated with CipherStash credentials
+
+script_location="$(dirname "${BASH_SOURCE[0]}")"
+bench_dir="$(cd "$script_location" && pwd)"
+repo_root="$(cd "$script_location/../.." && pwd)"
+eql_install_sql="$repo_root/release/cipherstash-encrypt.sql"
+scale="${1:-100k}"
+
+# Translate the scale label into a row count; v1 only knows 100k.
+if [[ "$scale" == "100k" ]]; then
+    row_count=100000
+else
+    echo "Unsupported scale: $scale (only 100k in v1)" >&2
+    exit 1
+fi
+
+# The EQL install script must have been built already.
+[[ -f "$eql_install_sql" ]] || {
+    echo "ERROR: $eql_install_sql not found. Run 'mise run build' first." >&2
+    exit 1
+}
+
+direct_url="postgresql://cipherstash:password@localhost:7433/cipherstash"
+via_proxy_url="postgresql://cipherstash:password@localhost:6433/cipherstash"
+
+# psql wrapper: first argument is the connection URL; any SQL error aborts.
+run_psql() {
+    local url="$1"
+    shift
+    psql "$url" -v ON_ERROR_STOP=1 "$@"
+}
+
+# Plaintext rows come from generate_series; they are sent through the Proxy so
+# each column is encrypted according to the search config from schema.sql.
+insert_rows_sql="
+INSERT INTO bench (encrypted_text, encrypted_int, encrypted_bigint)
+SELECT
+    ('text_' || (((gs - 1) % 1000) + 1))::text,
+    (((gs - 1) % 1000) + 1)::int,
+    (((gs - 1) % 1000) + 1)::bigint * 1000000000
+FROM generate_series(1, $row_count) AS gs;
+"
+
+index_and_analyze_sql="
+CREATE INDEX IF NOT EXISTS bench_text_hmac_idx   ON bench USING hash  (eql_v2.hmac_256(encrypted_text));
+CREATE INDEX IF NOT EXISTS bench_text_ore_idx    ON bench USING btree (encrypted_text eql_v2.encrypted_operator_class);
+CREATE INDEX IF NOT EXISTS bench_int_ore_idx     ON bench USING btree (encrypted_int eql_v2.encrypted_operator_class);
+CREATE INDEX IF NOT EXISTS bench_bigint_ore_idx  ON bench USING btree (encrypted_bigint eql_v2.encrypted_operator_class);
+CREATE INDEX IF NOT EXISTS bench_text_bloom_idx  ON bench USING gin   (eql_v2.bloom_filter(encrypted_text));
+ANALYZE bench;
+"
+
+echo "==> Installing EQL into bench-postgres"
+run_psql "$direct_url" -f "$eql_install_sql" >/dev/null
+
+echo "==> Applying bench schema and Proxy search configuration"
+run_psql "$direct_url" -f "$bench_dir/schema.sql"
+
+echo "==> Inserting $row_count plaintext rows through Proxy (this encrypts them)"
+run_psql "$via_proxy_url" -c "$insert_rows_sql"
+
+echo "==> Creating indexes and running ANALYZE"
+run_psql "$direct_url" -c "$index_and_analyze_sql"
+
+echo "==> Done. Rows: $row_count"
diff --git a/tests/benchmarks/reports/.gitkeep b/tests/benchmarks/reports/.gitkeep
diff --git a/tests/benchmarks/schema.sql b/tests/benchmarks/schema.sql
@@ -0,0 +1,35 @@
+-- Bench schema for Tier 2 benchmarks.
+-- Applied against the bench-postgres container AFTER generate.sh has installed
+-- release/cipherstash-encrypt.sql directly; Proxy's own EQL install is disabled
+-- (CS_DATABASE__INSTALL_EQL: "false" in docker-compose.yml).
+
+DROP TABLE IF EXISTS bench;
+
+CREATE TABLE bench (
+    id BIGINT GENERATED ALWAYS AS IDENTITY PRIMARY KEY,
+    encrypted_text eql_v2_encrypted,
+    encrypted_int eql_v2_encrypted,
+    encrypted_bigint eql_v2_encrypted
+);
+
+-- Proxy search configuration: tells Proxy which index terms to generate
+-- for each column when plaintext is inserted.
+--
+-- Signature: eql_v2.add_search_config(table, column, index, cast_as)
+-- (see src/config/functions.sql). add_search_config calls activate_config
+-- internally when migrating=false, so no explicit activate_config call.
+
+-- text column: equality (hmac), pattern match (bloom), ordering (ore)
+SELECT eql_v2.add_search_config('bench', 'encrypted_text', 'unique', 'text');
+SELECT eql_v2.add_search_config('bench', 'encrypted_text', 'match',  'text');
+SELECT eql_v2.add_search_config('bench', 'encrypted_text', 'ore',    'text');
+
+-- integer column: equality + ORE range/ordering
+SELECT eql_v2.add_search_config('bench', 'encrypted_int', 'unique', 'int');
+SELECT eql_v2.add_search_config('bench', 'encrypted_int', 'ore',    'int');
+
+-- bigint column: equality + ORE range/ordering
+SELECT eql_v2.add_search_config('bench', 'encrypted_bigint', 'unique', 'big_int');
+SELECT eql_v2.add_search_config('bench', 'encrypted_bigint', 'ore',    'big_int');
+
+-- Indexes are created in generate.sh after the data load, then ANALYZE runs.