From 2037fcdf6e25f3d3178317fab818250c8607b29d Mon Sep 17 00:00:00 2001
From: Michael Sitarzewski <msitarzewski@users.noreply.github.com>
Date: Thu, 19 Feb 2026 01:05:58 -0600
Subject: [PATCH 1/3] UX cleanup: collapse defaults, cross-provider
 challengers, truncation detection, PDF fix

- Thread detail: all sections collapsed by default, decision stays open
- Consensus max_tokens bumped 4096 -> 16384 with budget note in system prompts
- Truncation detection: finish_reason checked, truncated flag sent via WebSocket
- Challenger selection prefers cross-provider diversity
- Export dropdown menus use glass styling
- PDF export: add missing bold-italic (BI) TTF font variant

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 memory-bank/activeContext.md                  | 57 +++++---------
 memory-bank/progress.md                       |  1 +
 .../tasks/2026-02/190219_ux-cleanup.md        | 44 +++++++++++
 memory-bank/tasks/2026-02/README.md           | 15 ++++
 src/duh/api/routes/ws.py                      | 12 ++-
 src/duh/cli/app.py                            |  1 +
 src/duh/consensus/handlers.py                 | 75 +++++++++++++++----
 web/src/api/types.ts                          |  2 +
 .../consensus/ConsensusComplete.tsx           |  2 +-
 .../components/consensus/ConsensusPanel.tsx   |  2 +
 .../components/consensus/DissentBanner.tsx    |  4 +-
 web/src/components/consensus/PhaseCard.tsx    | 11 ++-
 web/src/components/shared/ExportMenu.tsx      |  2 +-
 web/src/components/threads/ThreadDetail.tsx   |  4 +-
 web/src/stores/consensus.ts                   | 16 +++-
 15 files changed, 181 insertions(+), 67 deletions(-)
 create mode 100644 memory-bank/tasks/2026-02/190219_ux-cleanup.md

diff --git a/memory-bank/activeContext.md b/memory-bank/activeContext.md
index f21221c..2790c0e 100644
--- a/memory-bank/activeContext.md
+++ b/memory-bank/activeContext.md
@@ -1,45 +1,27 @@
 # Active Context
 
-**Last Updated**: 2026-02-18
-**Current Phase**: Consensus UX — right-side nav, collapsible sections, decision-first layout
-**Next Action**: PR open for review.
+**Last Updated**: 2026-02-19
+**Current Phase**: UX cleanup and consensus engine hardening
+**Next Action**: PR ready for review.
 
-## What Just Shipped: Consensus Navigation & Collapsible Sections
+## What Just Shipped: UX Cleanup + Consensus Engine Improvements
 
-### Core Changes
-The consensus page and thread detail view now have proper navigation and information hierarchy for multi-round deliberations.
+### Thread Detail UX
+- All round sections collapsed by default when thread loads — decision stays open
+- Dissent inside decision block collapsed by default
+- `DissentBanner` gained `defaultOpen` prop for caller control
 
-**Before**: Long vertical scroll of rounds with no way to navigate or collapse. Decision buried at the bottom after all rounds.
-**After**:
-- Sticky right-side nav panel shows progress through rounds/phases
-- All sections are independently collapsible via a shared `Disclosure` primitive
-- Decision surfaces to the **top** when consensus is complete (both live + stored threads)
-- Individual challengers shown by model name in nav and each collapsible
-- Dissent gets equal treatment: collapsible `DissentBanner` with model attribution parsed from `[model:name]:` prefix
+### Consensus Engine Hardening
+- **max_tokens bumped 4096 -> 16384** for propose/challenge/revise phases — prevents LLM output truncation on long responses
+- **Token budget in system prompts** — LLMs now told their output budget so they can self-regulate length and end on complete thoughts
+- **Truncation detection** — `finish_reason` checked after each handler call; `truncated` flag sent via WebSocket; amber warning shown in PhaseCard UI
+- **Cross-provider challenger selection** — `select_challengers()` now prefers models from different providers (one per provider first, then fills). Prevents e.g. Opus proposing + two Sonnet variants challenging (same training biases)
 
-### New Shared Component: `Disclosure`
-Reusable chevron + toggle primitive (`web/src/components/shared/Disclosure.tsx`):
-- Props: `header`, `defaultOpen`, `forceOpen`, `className`
-- Used by: PhaseCard, TurnCard, ConsensusComplete, DissentBanner, ThreadDetail
+### Visual Polish
+- Export dropdown menus (both `ConsensusComplete` and `ExportMenu`) now use glass styling matching the design system (`glass-bg` + `backdrop-blur`)
 
-### Files Changed (17 files)
-**New files:**
-- `web/src/components/shared/Disclosure.tsx` — Shared collapsible primitive
-- `web/src/components/consensus/ConsensusNav.tsx` — Sticky nav for live consensus
-- `web/src/components/threads/ThreadNav.tsx` — Sticky nav for thread detail
-- `web/src/__tests__/consensus-nav.test.tsx` — 32 tests (Disclosure, PhaseCard, DissentBanner, TurnCard, ConsensusNav)
-- `web/src/__tests__/thread-nav.test.tsx` — 8 tests (ThreadNav)
-
-**Modified:**
-- `PhaseCard.tsx` — Uses Disclosure for outer collapse + per-challenger Disclosure
-- `TurnCard.tsx` — Uses Disclosure for outer collapse + per-contribution Disclosure
-- `ConsensusComplete.tsx` — Collapsible via Disclosure, dissent moved inside panel
-- `DissentBanner.tsx` — Uses Disclosure, parses `[model:name]:` prefix for ModelBadge
-- `ConsensusPanel.tsx` — Decision at top when complete, scroll target IDs
-- `ConsensusPage.tsx` — Flex-row layout with sticky ConsensusNav sidebar
-- `ThreadDetail.tsx` — Decision surfaced to top, DissentBanner for dissent, scroll IDs
-- `ThreadDetailPage.tsx` — Flex-row layout with sticky ThreadNav sidebar
-- Barrel exports: `consensus/index.ts`, `threads/index.ts`, `shared/index.ts`
+### PDF Export Bug Fix
+- `_setup_fonts()` was missing the bold-italic (`BI`) TTF font variant — caused crash when dissent content contained bold markdown rendered in italic context
 
 ### Test Results
 - 1586 Python tests + 166 Vitest tests (1752 total)
@@ -49,10 +31,9 @@ Reusable chevron + toggle primitive (`web/src/components/shared/Disclosure.tsx`)
 
 ## Current State
 
-- **Branch `consensus-nav-collapsible`** — ready for PR.
+- **Branch `ux-cleanup`** — ready for PR.
 - **1586 Python tests + 166 Vitest tests** (1752 total).
-- **~62 Python source files + 75 frontend source files** (~137 total).
-- All previous features intact (v0.1–v0.5 + export + epistemic confidence).
+- All previous features intact (v0.1–v0.5 + export + epistemic confidence + consensus nav).
 
 ## Open Questions (Still Unresolved)
 
diff --git a/memory-bank/progress.md b/memory-bank/progress.md
index 2381039..2dd8c67 100644
--- a/memory-bank/progress.md
+++ b/memory-bank/progress.md
@@ -181,3 +181,4 @@ Phase 0 benchmark framework — fully functional, pilot-tested on 5 questions.
 | 2026-02-17 | Export to Markdown & PDF (CLI + API + Web UI) | Done |
 | 2026-02-18 | Epistemic Confidence Phase A (rigor + domain caps + calibration) | Done |
 | 2026-02-18 | Consensus nav + collapsible sections + decision-first layout | Done |
+| 2026-02-19 | UX cleanup: collapse defaults, max_tokens 16384, cross-provider challengers, truncation detection, glass exports, PDF BI font fix | Done |
diff --git a/memory-bank/tasks/2026-02/190219_ux-cleanup.md b/memory-bank/tasks/2026-02/190219_ux-cleanup.md
new file mode 100644
index 0000000..0d0be8d
--- /dev/null
+++ b/memory-bank/tasks/2026-02/190219_ux-cleanup.md
@@ -0,0 +1,44 @@
+# 190219_ux-cleanup
+
+## Objective
+UX polish and bug fixes: thread detail collapse defaults, consensus engine improvements (token limits, cross-provider challengers, truncation detection), export menu glass styling, PDF export crash fix.
+
+## Outcome
+- All thread round sections collapsed by default; the decision stays open, with the dissent inside it collapsed
+- Consensus `max_tokens` bumped 4096 -> 16384 for propose/challenge/revise
+- Token budget communicated to LLMs in system prompts to prevent truncation
+- Truncation detection: `finish_reason` checked after each phase (any value other than `"stop"` is treated as truncated), `truncated` flag sent via WebSocket, amber warning shown in PhaseCard UI
+- Challenger selection prefers cross-provider diversity (one per provider first, then fill)
+- Export dropdown menus use glass styling (`glass-bg` + `backdrop-blur`)
+- PDF export crash fixed: missing bold-italic (`BI`) TTF font variant
+- All 1586 Python + 166 Vitest tests pass
+
+## Files Modified
+
+### Backend
+- `src/duh/consensus/handlers.py` — `max_tokens` 4096->16384; `_token_budget_note()` helper appended to all system prompts; `select_challengers()` rewritten for cross-provider diversity (prefers one model per different provider, then remaining cross-provider models, then same-provider models, then fills any leftover slots with the proposer as a self-ensemble)
+- `src/duh/api/routes/ws.py` — Captures `ModelResponse` from propose/challenge/revise handlers; sends `truncated` boolean in `phase_complete` and `challenge` WebSocket events
+- `src/duh/cli/app.py` — Added `self.add_font("DuhSans", "BI", path)` to fix bold-italic crash in PDF export
+
+### Frontend
+- `web/src/components/threads/ThreadDetail.tsx` — All rounds `defaultOpen={false}`; dissent in decision block `defaultOpen={false}`
+- `web/src/components/consensus/DissentBanner.tsx` — Added `defaultOpen` prop (defaults `true` for backward compat)
+- `web/src/components/consensus/PhaseCard.tsx` — Added `truncated` prop; renders an amber "Output truncated" warning when the phase content or any challenge is flagged as truncated; `challenges` entry type updated to include an optional `truncated` field
+- `web/src/components/consensus/ConsensusPanel.tsx` — Passes `truncated` flag from round data to PROPOSE and REVISE PhaseCards
+- `web/src/components/consensus/ConsensusComplete.tsx` — Export dropdown uses glass styling
+- `web/src/components/shared/ExportMenu.tsx` — Export dropdown uses glass styling
+- `web/src/stores/consensus.ts` — Added `truncated: string[]` to `RoundData`; `ChallengeEntry` gains `truncated` field; `handleEvent` tracks truncation per phase
+- `web/src/api/types.ts` — Added `truncated?: boolean` to `WSPhaseComplete` and `WSChallenge`
+
+## Patterns Applied
+- `systemPatterns.md#Disclosure` — reused for DissentBanner defaultOpen prop
+- Cross-provider challenger selection follows existing `select_challengers` pattern but adds provider diversity layer
+- Token budget note follows existing `_grounding_prefix()` pattern for system prompt composition
+
+## Architectural Decisions
+- **Token budget in system prompt**: LLMs don't know their `max_tokens` limit. Adding a budget instruction to the system prompt lets models self-regulate output length. Not a guarantee (models can't count tokens precisely), but it is expected to reduce truncation; the effect has not been measured.
+- **Cross-provider challengers**: Prefers models from different providers for genuine intellectual diversity. Same-provider models may share training data biases, reducing challenge quality.
+- **16384 max_tokens**: 4x increase from 4096. Balances thorough responses against cost (output tokens dominate cost for expensive models).
+
+## Artifacts
+- Branch: `ux-cleanup`
diff --git a/memory-bank/tasks/2026-02/README.md b/memory-bank/tasks/2026-02/README.md
index 9850c2a..d4dfc59 100644
--- a/memory-bank/tasks/2026-02/README.md
+++ b/memory-bank/tasks/2026-02/README.md
@@ -499,3 +499,18 @@
 - Frontend: CalibrationDashboard (metric cards + bar chart + bucket table), CalibrationPage, calibration Zustand store
 - Tests: 15 calibration tests, 20 confidence scoring tests, 4 CLI calibration tests
 - **Total: 1586 Python + 126 Vitest = 1712 tests**
+
+---
+
+## UX Cleanup + Consensus Engine Improvements
+
+### 2026-02-19: UX Cleanup
+- Thread detail: all round sections collapsed by default; the decision stays open, with the dissent inside it collapsed
+- `DissentBanner` gained `defaultOpen` prop
+- Export dropdown menus use glass styling (`glass-bg` + `backdrop-blur`)
+- PDF export crash fix: missing bold-italic (`BI`) TTF font variant in `_setup_fonts()`
+- `max_tokens` bumped 4096 -> 16384 for propose/challenge/revise
+- Token budget communicated to LLMs in system prompts via `_token_budget_note()`
+- Truncation detection: `finish_reason` checked, `truncated` flag sent via WebSocket, amber warning in PhaseCard
+- Cross-provider challenger selection: prefers one model per different provider for diversity
+- See: [190219_ux-cleanup.md](./190219_ux-cleanup.md)
diff --git a/src/duh/api/routes/ws.py b/src/duh/api/routes/ws.py
index 36ff8ff..8635294 100644
--- a/src/duh/api/routes/ws.py
+++ b/src/duh/api/routes/ws.py
@@ -131,12 +131,13 @@ async def _stream_consensus(
                 "round": ctx.current_round,
             }
         )
-        await handle_propose(ctx, pm, proposer)
+        propose_resp = await handle_propose(ctx, pm, proposer)
         await ws.send_json(
             {
                 "type": "phase_complete",
                 "phase": "PROPOSE",
                 "content": ctx.proposal or "",
+                "truncated": propose_resp.finish_reason != "stop",
             }
         )
 
@@ -153,13 +154,15 @@ async def _stream_consensus(
                 "round": ctx.current_round,
             }
         )
-        await handle_challenge(ctx, pm, challengers)
-        for ch in ctx.challenges:
+        challenge_resps = await handle_challenge(ctx, pm, challengers)
+        for i, ch in enumerate(ctx.challenges):
+            truncated = i < len(challenge_resps) and challenge_resps[i].finish_reason != "stop"
             await ws.send_json(
                 {
                     "type": "challenge",
                     "model": ch.model_ref,
                     "content": ch.content,
+                    "truncated": truncated,
                 }
             )
         await ws.send_json({"type": "phase_complete", "phase": "CHALLENGE"})
@@ -175,12 +178,13 @@ async def _stream_consensus(
                 "round": ctx.current_round,
             }
         )
-        await handle_revise(ctx, pm)
+        revise_resp = await handle_revise(ctx, pm)
         await ws.send_json(
             {
                 "type": "phase_complete",
                 "phase": "REVISE",
                 "content": ctx.revision or "",
+                "truncated": revise_resp.finish_reason != "stop",
             }
         )
 
diff --git a/src/duh/cli/app.py b/src/duh/cli/app.py
index 56ddc91..b3c9ea3 100644
--- a/src/duh/cli/app.py
+++ b/src/duh/cli/app.py
@@ -1307,6 +1307,7 @@ def _setup_fonts(self) -> None:
                         self.add_font("DuhSans", "", path)
                         self.add_font("DuhSans", "B", path)
                         self.add_font("DuhSans", "I", path)
+                        self.add_font("DuhSans", "BI", path)
                         self._use_ttf = True
                         self._font_family = "DuhSans"
                         break
diff --git a/src/duh/consensus/handlers.py b/src/duh/consensus/handlers.py
index 6dde013..4f91935 100644
--- a/src/duh/consensus/handlers.py
+++ b/src/duh/consensus/handlers.py
@@ -149,17 +149,29 @@ def _grounding_prefix() -> str:
     return f"Today's date is {today}. {_GROUNDING}"
 
 
+def _token_budget_note(max_tokens: int) -> str:
+    """Instruction telling the model its output token budget."""
+    return (
+        f"\n\nYour response budget is approximately {max_tokens:,} tokens. "
+        "Structure your answer to fit within this budget — be thorough but "
+        "concise. If the topic requires extensive detail, prioritize the most "
+        "important points and ensure your response ends with a complete thought."
+    )
+
+
 # ── Prompt building ───────────────────────────────────────────
 
 
-def build_propose_prompt(ctx: ConsensusContext) -> list[PromptMessage]:
+def build_propose_prompt(
+    ctx: ConsensusContext, *, max_tokens: int = 16384
+) -> list[PromptMessage]:
     """Build prompt messages for the PROPOSE phase.
 
     Round 1: system prompt + question.
     Round > 1: system prompt + question + previous round context
     (decision and challenges) so the proposer can improve.
     """
-    system = f"{_grounding_prefix()}\n\n{_PROPOSER_SYSTEM}"
+    system = f"{_grounding_prefix()}\n\n{_PROPOSER_SYSTEM}{_token_budget_note(max_tokens)}"
 
     if ctx.current_round <= 1 or not ctx.round_history:
         user_content = ctx.question
@@ -243,7 +255,7 @@ async def handle_propose(
     model_ref: str,
     *,
     temperature: float = 0.7,
-    max_tokens: int = 4096,
+    max_tokens: int = 16384,
     tool_registry: ToolRegistry | None = None,
 ) -> ModelResponse:
     """Execute the PROPOSE phase of consensus.
@@ -279,7 +291,7 @@ async def handle_propose(
         msg = f"handle_propose requires PROPOSE state, got {ctx.state.value}"
         raise ConsensusError(msg)
 
-    messages = build_propose_prompt(ctx)
+    messages = build_propose_prompt(ctx, max_tokens=max_tokens)
     provider, model_id = provider_manager.get_provider(model_ref)
 
     if tool_registry is not None:
@@ -316,6 +328,8 @@ async def handle_propose(
 def build_challenge_prompt(
     ctx: ConsensusContext,
     framing: str = "flaw",
+    *,
+    max_tokens: int = 16384,
 ) -> list[PromptMessage]:
     """Build prompt messages for the CHALLENGE phase.
 
@@ -325,9 +339,10 @@ def build_challenge_prompt(
     Args:
         ctx: Consensus context with the proposal to challenge.
         framing: One of the challenge framing types.
+        max_tokens: Token budget communicated to the model.
     """
     system_text = _CHALLENGE_FRAMINGS.get(framing, _CHALLENGE_FRAMINGS["flaw"])
-    system = f"{_grounding_prefix()}\n\n{system_text}"
+    system = f"{_grounding_prefix()}\n\n{system_text}{_token_budget_note(max_tokens)}"
     user_content = (
         f"Question: {ctx.question}\n\n"
         f"Answer from another expert (do NOT defer to this -- challenge it):\n"
@@ -374,13 +389,43 @@ def select_challengers(
             msg = "No panel models available for challenge"
             raise InsufficientModelsError(msg)
 
-    others = sorted(
-        (m for m in models if m.model_ref != proposer_model),
+    proposer_provider = proposer_model.split(":")[0]
+
+    others = [m for m in models if m.model_ref != proposer_model]
+
+    # Prefer models from different providers for true cross-provider challenge
+    cross_provider = sorted(
+        (m for m in others if m.provider_id != proposer_provider),
+        key=lambda m: m.output_cost_per_mtok,
+        reverse=True,
+    )
+    same_provider = sorted(
+        (m for m in others if m.provider_id == proposer_provider),
         key=lambda m: m.output_cost_per_mtok,
         reverse=True,
     )
 
-    selected = [m.model_ref for m in others[:count]]
+    # Pick cross-provider first, then fill with same-provider
+    selected: list[str] = []
+    used_providers: set[str] = set()
+    for m in cross_provider:
+        if len(selected) >= count:
+            break
+        # Prefer one model per provider for maximum diversity
+        if m.provider_id not in used_providers:
+            selected.append(m.model_ref)
+            used_providers.add(m.provider_id)
+    # If still not enough, add remaining cross-provider models
+    for m in cross_provider:
+        if len(selected) >= count:
+            break
+        if m.model_ref not in selected:
+            selected.append(m.model_ref)
+    # Then same-provider models
+    for m in same_provider:
+        if len(selected) >= count:
+            break
+        selected.append(m.model_ref)
     # Fill remaining slots with proposer (same-model ensemble)
     while len(selected) < count:
         selected.append(proposer_model)
@@ -415,7 +460,7 @@ async def _call_challenger(
 
     Returns (model_ref, framing, response).
     """
-    messages = build_challenge_prompt(ctx, framing=framing)
+    messages = build_challenge_prompt(ctx, framing=framing, max_tokens=max_tokens)
     provider, model_id = provider_manager.get_provider(model_ref)
 
     if tool_registry is not None:
@@ -446,7 +491,7 @@ async def handle_challenge(
     challenger_models: list[str],
     *,
     temperature: float = 0.7,
-    max_tokens: int = 4096,
+    max_tokens: int = 16384,
     tool_registry: ToolRegistry | None = None,
 ) -> list[ModelResponse]:
     """Execute the CHALLENGE phase of consensus.
@@ -527,14 +572,16 @@ async def handle_challenge(
 # ── REVISE prompt + handler ───────────────────────────────────
 
 
-def build_revise_prompt(ctx: ConsensusContext) -> list[PromptMessage]:
+def build_revise_prompt(
+    ctx: ConsensusContext, *, max_tokens: int = 16384
+) -> list[PromptMessage]:
     """Build prompt messages for the REVISE phase.
 
     System prompt instructs the reviser to address challenges.
     User prompt includes the question, original proposal, and all
     challenges so the revision addresses each one.
     """
-    system = f"{_grounding_prefix()}\n\n{_REVISER_SYSTEM}"
+    system = f"{_grounding_prefix()}\n\n{_REVISER_SYSTEM}{_token_budget_note(max_tokens)}"
 
     challenges_text = "\n\n".join(
         f"Challenge from {c.model_ref}:\n{c.content}" for c in ctx.challenges
@@ -557,7 +604,7 @@ async def handle_revise(
     model_ref: str | None = None,
     *,
     temperature: float = 0.7,
-    max_tokens: int = 4096,
+    max_tokens: int = 16384,
 ) -> ModelResponse:
     """Execute the REVISE phase of consensus.
 
@@ -604,7 +651,7 @@ async def handle_revise(
         msg = "handle_revise requires a model_ref or proposal_model"
         raise ConsensusError(msg)
 
-    messages = build_revise_prompt(ctx)
+    messages = build_revise_prompt(ctx, max_tokens=max_tokens)
     provider, model_id = provider_manager.get_provider(reviser_ref)
 
     response = await provider.send(
diff --git a/web/src/api/types.ts b/web/src/api/types.ts
index 26ed5d6..0963a8f 100644
--- a/web/src/api/types.ts
+++ b/web/src/api/types.ts
@@ -197,12 +197,14 @@ export interface WSPhaseComplete {
   type: 'phase_complete'
   phase: ConsensusPhase
   content?: string
+  truncated?: boolean
 }
 
 export interface WSChallenge {
   type: 'challenge'
   model: string
   content: string
+  truncated?: boolean
 }
 
 export interface WSCommit {
diff --git a/web/src/components/consensus/ConsensusComplete.tsx b/web/src/components/consensus/ConsensusComplete.tsx
index 5abf6a0..b0dd297 100644
--- a/web/src/components/consensus/ConsensusComplete.tsx
+++ b/web/src/components/consensus/ConsensusComplete.tsx
@@ -140,7 +140,7 @@ export function ConsensusComplete({ decision, confidence, rigor, dissent, cost,
             Export
           </GlowButton>
           {exportOpen && (
-            <div className="absolute bottom-full left-0 mb-1 bg-[var(--color-bg-secondary)] border border-[var(--color-border)] rounded-lg shadow-lg py-1 min-w-[200px] z-10">
+            <div className="absolute bottom-full left-0 mb-1 bg-[var(--glass-bg)] backdrop-blur-[var(--glass-blur)] border border-[var(--color-border)] rounded-[var(--radius-md)] shadow-lg py-1 min-w-[200px] z-50">
               <button
                 className="w-full text-left px-3 py-1.5 text-xs hover:bg-[var(--color-bg-tertiary)] text-[var(--color-text)]"
                 onClick={() => handleExportMarkdown('decision')}
diff --git a/web/src/components/consensus/ConsensusPanel.tsx b/web/src/components/consensus/ConsensusPanel.tsx
index baac70c..13ff2c3 100644
--- a/web/src/components/consensus/ConsensusPanel.tsx
+++ b/web/src/components/consensus/ConsensusPanel.tsx
@@ -69,6 +69,7 @@ export function ConsensusPanel() {
                     isActive={isActive && currentPhase === 'PROPOSE' && round.round === currentRound}
                     collapsible={isCompletedRound}
                     defaultOpen={false}
+                    truncated={round.truncated.includes('PROPOSE')}
                   />
                 )}
 
@@ -91,6 +92,7 @@ export function ConsensusPanel() {
                     isActive={isActive && currentPhase === 'REVISE' && round.round === currentRound}
                     collapsible={isCompletedRound}
                     defaultOpen={false}
+                    truncated={round.truncated.includes('REVISE')}
                   />
                 )}
 
diff --git a/web/src/components/consensus/DissentBanner.tsx b/web/src/components/consensus/DissentBanner.tsx
index 20a9304..83f08a8 100644
--- a/web/src/components/consensus/DissentBanner.tsx
+++ b/web/src/components/consensus/DissentBanner.tsx
@@ -9,7 +9,7 @@ function parseModelFromDissent(dissent: string): { model: string | null; content
   return { model: null, content: dissent }
 }
 
-export function DissentBanner({ dissent }: { dissent: string }) {
+export function DissentBanner({ dissent, defaultOpen = true }: { dissent: string; defaultOpen?: boolean }) {
   const { model, content } = parseModelFromDissent(dissent)
 
   return (
@@ -21,7 +21,7 @@ export function DissentBanner({ dissent }: { dissent: string }) {
             {model && <ModelBadge model={model} />}
           </>
         }
-        defaultOpen
+        defaultOpen={defaultOpen}
       >
         <div className="text-sm text-[var(--color-text-secondary)]">
           <Markdown>{content}</Markdown>
diff --git a/web/src/components/consensus/PhaseCard.tsx b/web/src/components/consensus/PhaseCard.tsx
index a1e438c..95cda12 100644
--- a/web/src/components/consensus/PhaseCard.tsx
+++ b/web/src/components/consensus/PhaseCard.tsx
@@ -8,12 +8,13 @@ interface PhaseCardProps {
   models?: string[]
   content?: string | null
   isActive?: boolean
-  challenges?: Array<{ model: string; content: string }>
+  challenges?: Array<{ model: string; content: string; truncated?: boolean }>
   collapsible?: boolean
   defaultOpen?: boolean
+  truncated?: boolean
 }
 
-export function PhaseCard({ phase, model, models, content, isActive, challenges, collapsible, defaultOpen = true }: PhaseCardProps) {
+export function PhaseCard({ phase, model, models, content, isActive, challenges, collapsible, defaultOpen = true, truncated }: PhaseCardProps) {
   const header = (
     <>
       <span className="font-mono text-xs text-[var(--color-primary)] font-semibold">{phase}</span>
@@ -54,6 +55,12 @@ export function PhaseCard({ phase, model, models, content, isActive, challenges,
         </div>
       )}
 
+      {(truncated || challenges?.some((ch) => ch.truncated)) && (
+        <p className="text-[10px] font-mono text-[var(--color-amber)] mt-2">
+          Output truncated — response hit token limit
+        </p>
+      )}
+
       {isActive && !content && !challenges?.length && (
         <div className="flex items-center gap-2 text-[var(--color-text-dim)] text-xs font-mono">
           <svg className="animate-spin h-3 w-3" viewBox="0 0 24 24" fill="none">
diff --git a/web/src/components/shared/ExportMenu.tsx b/web/src/components/shared/ExportMenu.tsx
index b63469b..0f1cf6f 100644
--- a/web/src/components/shared/ExportMenu.tsx
+++ b/web/src/components/shared/ExportMenu.tsx
@@ -148,7 +148,7 @@ export function ExportMenu({ thread }: ExportMenuProps) {
         {downloading ? 'Exporting...' : 'Export'}
       </GlowButton>
       {open && (
-        <div className="absolute top-full right-0 mt-1 bg-[var(--color-bg)] border border-[var(--color-border)] rounded-lg shadow-lg py-1 min-w-[200px] z-50">
+        <div className="absolute top-full right-0 mt-1 bg-[var(--glass-bg)] backdrop-blur-[var(--glass-blur)] border border-[var(--color-border)] rounded-[var(--radius-md)] shadow-lg py-1 min-w-[200px] z-50">
           <button
             className="w-full text-left px-3 py-1.5 text-xs hover:bg-[var(--color-bg-tertiary)] text-[var(--color-text)]"
             onClick={() => handleMarkdown('decision')}
diff --git a/web/src/components/threads/ThreadDetail.tsx b/web/src/components/threads/ThreadDetail.tsx
index 4fc9e8c..41a15a4 100644
--- a/web/src/components/threads/ThreadDetail.tsx
+++ b/web/src/components/threads/ThreadDetail.tsx
@@ -100,7 +100,7 @@ export function ThreadDetail() {
               </div>
               {finalDecision.dissent && (
                 <div className="mt-4">
-                  <DissentBanner dissent={finalDecision.dissent} />
+                  <DissentBanner dissent={finalDecision.dissent} defaultOpen={false} />
                 </div>
               )}
             </Disclosure>
@@ -113,7 +113,7 @@ export function ThreadDetail() {
           <TurnCard
             turn={turn}
             collapsible={currentThread.turns.length > 1}
-            defaultOpen={!finalDecision && i === currentThread.turns.length - 1}
+            defaultOpen={false}
           />
         </div>
       ))}
diff --git a/web/src/stores/consensus.ts b/web/src/stores/consensus.ts
index 3c2607a..5ecfd4f 100644
--- a/web/src/stores/consensus.ts
+++ b/web/src/stores/consensus.ts
@@ -12,6 +12,7 @@ export type ConsensusStatus = 'idle' | 'connecting' | 'streaming' | 'complete' |
 export interface ChallengeEntry {
   model: string
   content: string
+  truncated?: boolean
 }
 
 export interface RoundData {
@@ -25,6 +26,7 @@ export interface RoundData {
   confidence: number | null
   rigor: number | null
   dissent: string | null
+  truncated: string[]
 }
 
 interface ConsensusState {
@@ -68,6 +70,7 @@ function createEmptyRound(round: number): RoundData {
     confidence: null,
     rigor: null,
     dissent: null,
+    truncated: [],
   }
 }
 
@@ -193,8 +196,13 @@ function handleEvent(
       const [round, idx] = found
 
       const update: Partial<RoundData> = {}
-      if (event.phase === 'PROPOSE') update.proposal = event.content ?? null
-      else if (event.phase === 'REVISE') update.revision = event.content ?? null
+      if (event.phase === 'PROPOSE') {
+        update.proposal = event.content ?? null
+        if (event.truncated) update.truncated = [...round.truncated, 'PROPOSE']
+      } else if (event.phase === 'REVISE') {
+        update.revision = event.content ?? null
+        if (event.truncated) update.truncated = [...round.truncated, 'REVISE']
+      }
 
       set({ rounds: updateRound(state.rounds, idx, { ...round, ...update }) })
       break
@@ -205,9 +213,11 @@ function handleEvent(
       if (!found) break
       const [round, idx] = found
 
+      const truncatedUpdate = event.truncated ? [...round.truncated, `CHALLENGE:${event.model}`] : round.truncated
       set({
         rounds: updateRound(state.rounds, idx, {
-          challenges: [...round.challenges, { model: event.model, content: event.content }],
+          challenges: [...round.challenges, { model: event.model, content: event.content, truncated: event.truncated }],
+          truncated: truncatedUpdate,
         }),
       })
       break

From 3790edda92e68703cf4ac80cc2cccbe735c916df Mon Sep 17 00:00:00 2001
From: Michael Sitarzewski <msitarzewski@users.noreply.github.com>
Date: Thu, 19 Feb 2026 01:20:22 -0600
Subject: [PATCH 2/3] Fix ruff E501 line-too-long errors

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 src/duh/api/routes/ws.py      | 7 +++++--
 src/duh/consensus/handlers.py | 6 ++++--
 2 files changed, 9 insertions(+), 4 deletions(-)

diff --git a/src/duh/api/routes/ws.py b/src/duh/api/routes/ws.py
index 8635294..805e543 100644
--- a/src/duh/api/routes/ws.py
+++ b/src/duh/api/routes/ws.py
@@ -156,13 +156,16 @@ async def _stream_consensus(
         )
         challenge_resps = await handle_challenge(ctx, pm, challengers)
         for i, ch in enumerate(ctx.challenges):
-            truncated = i < len(challenge_resps) and challenge_resps[i].finish_reason != "stop"
+            resp_truncated = (
+                i < len(challenge_resps)
+                and challenge_resps[i].finish_reason != "stop"
+            )
             await ws.send_json(
                 {
                     "type": "challenge",
                     "model": ch.model_ref,
                     "content": ch.content,
-                    "truncated": truncated,
+                    "truncated": resp_truncated,
                 }
             )
         await ws.send_json({"type": "phase_complete", "phase": "CHALLENGE"})
diff --git a/src/duh/consensus/handlers.py b/src/duh/consensus/handlers.py
index 4f91935..aef2150 100644
--- a/src/duh/consensus/handlers.py
+++ b/src/duh/consensus/handlers.py
@@ -171,7 +171,8 @@ def build_propose_prompt(
     Round > 1: system prompt + question + previous round context
     (decision and challenges) so the proposer can improve.
     """
-    system = f"{_grounding_prefix()}\n\n{_PROPOSER_SYSTEM}{_token_budget_note(max_tokens)}"
+    budget = _token_budget_note(max_tokens)
+    system = f"{_grounding_prefix()}\n\n{_PROPOSER_SYSTEM}{budget}"
 
     if ctx.current_round <= 1 or not ctx.round_history:
         user_content = ctx.question
@@ -581,7 +582,8 @@ def build_revise_prompt(
     User prompt includes the question, original proposal, and all
     challenges so the revision addresses each one.
     """
-    system = f"{_grounding_prefix()}\n\n{_REVISER_SYSTEM}{_token_budget_note(max_tokens)}"
+    budget = _token_budget_note(max_tokens)
+    system = f"{_grounding_prefix()}\n\n{_REVISER_SYSTEM}{budget}"
 
     challenges_text = "\n\n".join(
         f"Challenge from {c.model_ref}:\n{c.content}" for c in ctx.challenges

From f0c84af024a3ae09c5fbf5de86671db34a30d9a3 Mon Sep 17 00:00:00 2001
From: Michael Sitarzewski <msitarzewski@users.noreply.github.com>
Date: Thu, 19 Feb 2026 01:28:45 -0600
Subject: [PATCH 3/3] Apply ruff formatting to ws.py

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 src/duh/api/routes/ws.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/duh/api/routes/ws.py b/src/duh/api/routes/ws.py
index 805e543..39a5b50 100644
--- a/src/duh/api/routes/ws.py
+++ b/src/duh/api/routes/ws.py
@@ -157,8 +157,7 @@ async def _stream_consensus(
         challenge_resps = await handle_challenge(ctx, pm, challengers)
         for i, ch in enumerate(ctx.challenges):
             resp_truncated = (
-                i < len(challenge_resps)
-                and challenge_resps[i].finish_reason != "stop"
+                i < len(challenge_resps) and challenge_resps[i].finish_reason != "stop"
             )
             await ws.send_json(
                 {