brownjuly2003-code
diff --git a/‎chroma_data/chroma.sqlite3‎
0 Bytes b/‎chroma_data/chroma.sqlite3‎
0 Bytes
diff --git a/‎chroma_data/fc9668d3-4384-40d9-aa8d-0010807a5a68/data_level0.bin‎
0 Bytes b/‎chroma_data/fc9668d3-4384-40d9-aa8d-0010807a5a68/data_level0.bin‎
0 Bytes
diff --git a/‎chroma_data/fc9668d3-4384-40d9-aa8d-0010807a5a68/length.bin‎
Lines changed: 1 addition & 1 deletion b/‎chroma_data/fc9668d3-4384-40d9-aa8d-0010807a5a68/length.bin‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎docs/NEXT_SESSION.md‎
Lines changed: 24 additions & 0 deletions b/‎docs/NEXT_SESSION.md‎
Lines changed: 24 additions & 0 deletions
diff --git a/‎scripts/p3f_acceptance.py‎
Lines changed: 171 additions & 0 deletions b/‎scripts/p3f_acceptance.py‎
Lines changed: 171 additions & 0 deletions
diff --git a/‎src/nl_sql/agent/nodes/_support.py‎
Lines changed: 24 additions & 0 deletions b/‎src/nl_sql/agent/nodes/_support.py‎
Lines changed: 24 additions & 0 deletions
diff --git a/‎tests/agent/nodes/test_schema_link_hints.py‎
Lines changed: 58 additions & 0 deletions b/‎tests/agent/nodes/test_schema_link_hints.py‎
Lines changed: 58 additions & 0 deletions
@@ -1 +1 @@
-invalid type: string "Table: PlaylistTrack (rows=8715)\nPrimary key: PlaylistId, TrackId\nColumns:\n  - PlaylistId: INTEGER [PK NOT NULL] | nulls=0 (0.0%), distinct=14 | samples: 1, 8, 5\n  - TrackId: INTEGER [PK NOT NULL] | nulls=0 (0.0%), distinct=3503 | samples: 3403, 3404, 3408\nForeign keys:\n  - (TrackId) -> Track(TrackId)\n  - (PlaylistId) -> Playlist(PlaylistId)", expected a boolean�������
+invalid type: string "Table: Track (rows=3503)\nPrimary key: TrackId\nColumns:\n  - TrackId: INTEGER [PK NOT NULL] | nulls=0 (0.0%), distinct=3503 | samples: 1, 2, 3\n  - Name: NVARCHAR(200) [NOT NULL] | nulls=0 (0.0%), distinct=3257 | samples: '2 Minutes To Midnight', 'Hallowed Be Thy Name', 'Iron Maiden'\n  - AlbumId: INTEGER [NULL] | nulls=0 (0.0%), distinct=347 | samples: 141, 23, 73\nn�������
@@ -3,6 +3,30 @@
 > Один лист, без воды. Берёшь, делаешь, обновляешь `SESSION_HANDOFF.md`,
 > переписываешь этот файл под следующий sprint.
 
+## 2026-05-23 continuation — P3.F harness + qid 1404 narrow hint
+
+**Сделано:**
+- Добавлен qid-level acceptance harness: `scripts/p3f_acceptance.py`.
+  Он проверяет report JSON по двум P3.F target qids:
+  - `1404`: требует `event.type`, запрещает `expense.expense_description/type`.
+  - `207`: требует `connected.atom_id`, запрещает `connected.bond_id`.
+- Текущий v20 report ожидаемо красный по обоим target qids:
+  `uv run python scripts/p3f_acceptance.py --report eval/reports/2026-05-22/v20-kimi-k2-thinking-merged.json`.
+- Добавлен узкий schema-link hint в `render_schema_block()` только для
+  `student_club` + вопроса про `expense` type/event. Это не generic FK booster.
+- In-memory smoke без записи report: config C на `qid 1404` теперь дал
+  `match=True`, pred SQL использует `event.type`.
+- Gate: `uv run pytest -q` → 315 passed; `uv run ruff check src tests scripts app` clean;
+  `uv run mypy --strict src` clean; `git diff --check` clean, но Git печатает
+  Windows autocrlf warning для `_support.py`. Байтовая проверка: все изменённые
+  текстовые файлы `CRLF=0`.
+
+**Следующее:**
+1. Прогнать durable exact-qid report: `eval_baseline.py --config C --only-qids 1404,207 --report-suffix p3f-targets`.
+2. Прогнать `scripts/p3f_acceptance.py --report <that-report> --require-pass`.
+3. Если `1404` подтверждён, не трогать generic FK linker; отдельно проектировать `207`,
+   потому натуральный `connected.bond_id` path всё ещё опасен.
+
 ## 2026-05-22 v20 — **87.5% EA verified** (BIRD-official set scoring), above #1 paid SOTA by +5.55pp
 
 **Состояние:**
 
@@ -0,0 +1,171 @@
+"""Qid-level acceptance harness for the narrow P3.F JOIN-path work.
+
+This script checks a finished eval/voting report. It does not call providers,
+does not run a broad residue sweep, and does not implement the JOIN linker.
+
+Usage:
+    uv run python scripts/p3f_acceptance.py \
+        --report eval/reports/2026-05-22/v20-kimi-k2-thinking-merged.json
+    uv run python scripts/p3f_acceptance.py --report <candidate>.json --require-pass
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import sys
+from collections.abc import Mapping
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Any
+
+from sqlglot import exp, parse_one
+from sqlglot.errors import ParseError
+
+ColumnRef = tuple[str, str]
+
+
+@dataclass(frozen=True)
+class AcceptanceTarget:
+    qid: int
+    label: str
+    required_columns: tuple[ColumnRef, ...]
+    forbidden_columns: tuple[ColumnRef, ...] = ()
+
+
+@dataclass(frozen=True)
+class AcceptanceResult:
+    qid: int
+    label: str
+    accepted: bool
+    match: bool
+    reasons: tuple[str, ...]
+    pred_sql: str
+
+
+TARGETS: tuple[AcceptanceTarget, ...] = (
+    AcceptanceTarget(
+        qid=1404,
+        label="student_club expense type must come from event.type",
+        required_columns=(("event", "type"),),
+        forbidden_columns=(("expense", "expense_description"), ("expense", "type")),
+    ),
+    AcceptanceTarget(
+        qid=207,
+        label="toxicology double bond path must not shortcut through connected.bond_id",
+        required_columns=(("connected", "atom_id"),),
+        forbidden_columns=(("connected", "bond_id"),),
+    ),
+)
+
+
+def evaluate_report(report: Mapping[str, Any]) -> list[AcceptanceResult]:
+    records = _records_by_qid(report)
+    missing = [target.qid for target in TARGETS if target.qid not in records]
+    if missing:
+        raise ValueError(f"missing target qids: {missing}")
+    return [_evaluate_record(records[target.qid], target) for target in TARGETS]
+
+
+def main(argv: list[str] | None = None) -> int:
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument("--report", type=Path, required=True)
+    parser.add_argument(
+        "--require-pass",
+        action="store_true",
+        help="return exit code 1 unless every P3.F target is accepted",
+    )
+    args = parser.parse_args(argv)
+
+    report = json.loads(args.report.read_text(encoding="utf-8"))
+    try:
+        results = evaluate_report(report)
+    except ValueError as exc:
+        print(f"[error] {exc}", file=sys.stderr)
+        return 3
+
+    print(f"Report: {args.report}")
+    for result in results:
+        flag = "PASS" if result.accepted else "FAIL"
+        print(f"{flag} qid={result.qid} match={result.match} - {result.label}")
+        for reason in result.reasons:
+            print(f"  - {reason}")
+
+    if args.require_pass and any(not result.accepted for result in results):
+        return 1
+    return 0
+
+
+def _evaluate_record(
+    record: Mapping[str, Any],
+    target: AcceptanceTarget,
+) -> AcceptanceResult:
+    pred_sql = str(record.get("pred_sql") or "")
+    match = bool(record.get("match"))
+    columns, parse_error = _qualified_columns(pred_sql)
+    reasons: list[str] = []
+    if not match:
+        reasons.append("EA match is false")
+    if parse_error:
+        reasons.append(parse_error)
+    for table, column in target.required_columns:
+        if (table, column) not in columns:
+            reasons.append(f"missing required column {table}.{column}")
+    for table, column in target.forbidden_columns:
+        if (table, column) in columns:
+            reasons.append(f"forbidden column {table}.{column} is present")
+    return AcceptanceResult(
+        qid=target.qid,
+        label=target.label,
+        accepted=not reasons,
+        match=match,
+        reasons=tuple(reasons),
+        pred_sql=pred_sql,
+    )
+
+
+def _records_by_qid(report: Mapping[str, Any]) -> dict[int, Mapping[str, Any]]:
+    raw_records = report.get("records") or []
+    records: dict[int, Mapping[str, Any]] = {}
+    for raw_record in raw_records:
+        if not isinstance(raw_record, Mapping):
+            continue
+        qid = raw_record.get("question_id")
+        if isinstance(qid, int):
+            records[qid] = raw_record
+    return records
+
+
+def _qualified_columns(sql: str) -> tuple[set[ColumnRef], str | None]:
+    if not sql.strip():
+        return set(), None
+    try:
+        tree = parse_one(sql, read="sqlite")
+    except ParseError as exc:
+        return set(), f"SQL parse failed: {exc}"
+
+    alias_to_table: dict[str, str] = {}
+    for table in tree.find_all(exp.Table):
+        table_name = _lower(table.name)
+        if not table_name:
+            continue
+        alias_to_table[table_name] = table_name
+        alias_to_table[_lower(table.alias_or_name)] = table_name
+
+    columns: set[ColumnRef] = set()
+    for column in tree.find_all(exp.Column):
+        column_name = _lower(column.name)
+        table_name = _lower(column.table)
+        if not column_name:
+            continue
+        resolved_table = alias_to_table.get(table_name, table_name)
+        columns.add((resolved_table, column_name))
+    return columns, None
+
+
+def _lower(value: str) -> str:
+    return value.lower()
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
@@ -146,6 +146,9 @@ def render_schema_block(
     join_hints = _render_join_hints_appendix(all_hits)
     if join_hints:
         blocks.append(join_hints)
+    schema_link_hints = _render_schema_link_hints_appendix(context, all_hits)
+    if schema_link_hints:
+        blocks.append(schema_link_hints)
     appendix = _render_extended_samples_appendix(context.extended_samples)
     if appendix:
         blocks.append(appendix)
@@ -189,6 +192,27 @@ def _format_join_hint(
     return [f"{table}.({local_cols}) -> {ref_table}.({ref_cols})"]
 
 
+def _render_schema_link_hints_appendix(context: ContextBundle, hits: list[Any]) -> str:
+    tables = {str(hit.table_name).lower() for hit in hits}
+    question = context.question.lower()
+    db_id = context.db_id.lower()
+    if (
+        db_id in {"student_club", "bird_student_club"}
+        and {"event", "expense"} <= tables
+        and "type" in question
+        and "expense" in question
+        and "event" in question
+    ):
+        return "\n".join(
+            [
+                "# Schema-link hints",
+                "- For event-linked expense questions asking for a type, use event.type. "
+                "expense.expense_description describes individual expense rows.",
+            ]
+        )
+    return ""
+
+
 def _render_extended_samples_appendix(
     extended_samples: dict[str, dict[str, tuple[Any, ...]]] | None,
 ) -> str:
 
@@ -0,0 +1,58 @@
+from __future__ import annotations
+
+from nl_sql.agent.nodes._support import render_schema_block
+from nl_sql.schema_index.indexer import SchemaQueryHit
+from nl_sql.schema_index.retriever import ContextBundle
+
+
+def test_student_club_expense_type_hint_points_to_event_type() -> None:
+    rendered = render_schema_block(
+        ContextBundle(
+            db_id="student_club",
+            question="Identify the type of expenses and their total value approved for October Meeting event.",
+            schema_hits=[
+                _hit("event", "Table: event\nColumns:\n  - type: TEXT [NULL]"),
+                _hit(
+                    "expense",
+                    "Table: expense\nColumns:\n  - expense_description: TEXT [NULL]\n  - cost: REAL [NULL]",
+                ),
+            ],
+            fk_neighbours=[],
+            fewshots=[],
+        )
+    )
+
+    assert "# Schema-link hints" in rendered
+    assert "event.type" in rendered
+    assert "expense.expense_description" in rendered
+
+
+def test_student_club_expense_type_hint_is_question_scoped() -> None:
+    rendered = render_schema_block(
+        ContextBundle(
+            db_id="student_club",
+            question="List every expense description for October Meeting.",
+            schema_hits=[
+                _hit("event", "Table: event\nColumns:\n  - type: TEXT [NULL]"),
+                _hit(
+                    "expense",
+                    "Table: expense\nColumns:\n  - expense_description: TEXT [NULL]",
+                ),
+            ],
+            fk_neighbours=[],
+            fewshots=[],
+        )
+    )
+
+    assert "# Schema-link hints" not in rendered
+
+
+def _hit(table_name: str, text: str) -> SchemaQueryHit:
+    return SchemaQueryHit(
+        chunk_id=f"student_club::{table_name}",
+        table_name=table_name,
+        db_id="student_club",
+        text=text,
+        distance=0.0,
+        metadata={"table_name": table_name, "db_id": "student_club"},
+    )
Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		`-invalid type: string "Table: PlaylistTrack (rows=8715)\nPrimary key: PlaylistId, TrackId\nColumns:\n - PlaylistId: INTEGER [PK NOT NULL] \| nulls=0 (0.0%), distinct=14 \| samples: 1, 8, 5\n - TrackId: INTEGER [PK NOT NULL] \| nulls=0 (0.0%), distinct=3503 \| samples: 3403, 3404, 3408\nForeign keys:\n - (TrackId) -> Track(TrackId)\n - (PlaylistId) -> Playlist(PlaylistId)", expected a boolean��`
	`1`	`+invalid type: string "Table: Track (rows=3503)\nPrimary key: TrackId\nColumns:\n - TrackId: INTEGER [PK NOT NULL] \| nulls=0 (0.0%), distinct=3503 \| samples: 1, 2, 3\n - Name: NVARCHAR(200) [NOT NULL] \| nulls=0 (0.0%), distinct=3257 \| samples: '2 Minutes To Midnight', 'Hallowed Be Thy Name', 'Iron Maiden'\n - AlbumId: INTEGER [NULL] \| nulls=0 (0.0%), distinct=347 \| samples: 141, 23, 73\nn��`